URL https://opencores.org/ocsvn/neorv32/neorv32/trunk

Subversion Repositories neorv32

[/] [neorv32/] [trunk/] [sw/] [example/] [floating_point_test/] [neorv32_zfinx_extension_intrinsics.h] - Blame information for rev 74

Details | Compare with Previous | View Log


// #################################################################################################
// # << NEORV32 - Intrinsics + Emulation Functions for the RISC-V "Zfinx" CPU extension >>         #
// # ********************************************************************************************* #
// # The intrinsics provided by this library allow to use the hardware floating-point unit of the  #
// # RISC-V Zfinx CPU extension without the need for Zfinx support by the compiler / toolchain.    #
// # ********************************************************************************************* #
// # BSD 3-Clause License                                                                          #
// #                                                                                               #
// # Copyright (c) 2022, Stephan Nolting. All rights reserved.                                     #
// #                                                                                               #
// # Redistribution and use in source and binary forms, with or without modification, are          #
// # permitted provided that the following conditions are met:                                     #
// #                                                                                               #
// # 1. Redistributions of source code must retain the above copyright notice, this list of        #
// #    conditions and the following disclaimer.                                                   #
// #                                                                                               #
// # 2. Redistributions in binary form must reproduce the above copyright notice, this list of     #
// #    conditions and the following disclaimer in the documentation and/or other materials        #
// #    provided with the distribution.                                                            #
// #                                                                                               #
// # 3. Neither the name of the copyright holder nor the names of its contributors may be used to  #
// #    endorse or promote products derived from this software without specific prior written      #
// #    permission.                                                                                #
// #                                                                                               #
// # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS   #
// # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF               #
// # MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE    #
// # COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,     #
// # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE #
// # GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED    #
// # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING     #
// # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED  #
// # OF THE POSSIBILITY OF SUCH DAMAGE.                                                            #
// # ********************************************************************************************* #
// # The NEORV32 Processor - https://github.com/stnolting/neorv32              (c) Stephan Nolting #
// #################################################################################################
 
 
/**********************************************************************//**
 * @file floating_point_test/neorv32_zfinx_extension_intrinsics.h
 * @author Stephan Nolting
 *
 * @brief "Intrinsic" library for the NEORV32 single-precision floating-point in x registers (Zfinx) extension
 * @brief Also provides emulation functions for all intrinsics (functionality re-built in pure software). The functionality of the emulation
 * @brief functions is based on the RISC-V floating-point spec.
 *
 * @note All operations from this library use the default GCC "round to nearest, ties to even" rounding mode.
 *
 * @warning This library is just a temporary fall-back until the Zfinx extensions are supported by the upstream RISC-V GCC port.
 **************************************************************************/
 
#ifndef neorv32_zfinx_extension_intrinsics_h
#define neorv32_zfinx_extension_intrinsics_h
 
#define __USE_GNU
 
#include <fenv.h>
//#pragma STDC FENV_ACCESS ON
 
#define _GNU_SOURCE
 
#include <float.h>
#include <math.h>
 
 
/**********************************************************************//**
 * Sanity check
 **************************************************************************/
#if defined __riscv_f || (__riscv_flen == 32)
  #error Application programs using the Zfinx intrinsic library have to be compiled WITHOUT the <F> MARCH ISA attribute!
#endif
 
 
/**********************************************************************//**
 * Custom data type to access floating-point values as native floats and in binary representation
 *
 * Both members overlay the same storage, so a value written through one member
 * can be read back through the other (assumes float is 32 bits wide - TODO confirm for the target).
 **************************************************************************/
typedef union
{
  uint32_t binary_value; /**< Access in binary representation */
  float    float_value;  /**< Access as native float */
} float_conv_t;
 
 
// ################################################################################################
// Helper functions
// ################################################################################################
 
/**********************************************************************//**
 * Replace a subnormal (de-normal) number by a zero of the same sign.
 *
 * @warning Subnormal numbers are not supported yet! They are flushed to zero.
 *
 * @param[in] tmp Source operand.
 * @return Signed zero if the operand is subnormal, the unmodified operand otherwise.
 **************************************************************************/
float subnormal_flush(float tmp) {

  // everything that is not subnormal passes through untouched
  if (fpclassify(tmp) != FP_SUBNORMAL) {
    return tmp;
  }

  // keep the sign of the flushed value
  return (signbit(tmp) != 0) ? -0.0f : +0.0f;
}
 
 
// ################################################################################################
// Exception access
// ################################################################################################
 
/**********************************************************************//**
 * Read-and-clear the exception flags of the fflags CSR (floating-point hardware).
 *
 * @return Floating point exception status word (value of fflags before it was cleared).
 **************************************************************************/
uint32_t get_hw_exceptions(void) {

  // sample the flags first ...
  const uint32_t flags = neorv32_cpu_csr_read(CSR_FFLAGS);

  // ... then write zero to the CSR so the next call starts from a clean status word
  neorv32_cpu_csr_write(CSR_FFLAGS, 0);

  return flags;
}
 
 
/**********************************************************************//**
 * Get exception flags from C runtime (floating-point emulation).
 *
 * @warning WORK-IN-PROGRESS!
 *
 * @return Floating point exception status word.
 **************************************************************************/
uint32_t get_sw_exceptions(void) {
 
  const uint32_t FP_EXC_NV_C = 1 << 0; // invalid operation
  const uint32_t FP_EXC_DZ_C = 1 << 1; // divide by zero
  const uint32_t FP_EXC_OF_C = 1 << 2; // overflow
  const uint32_t FP_EXC_UF_C = 1 << 3; // underflow
  const uint32_t FP_EXC_NX_C = 1 << 4; // inexact
 
  int fpeRaised = fetestexcept(FE_ALL_EXCEPT);
 
  uint32_t res = 0;
 
  if (fpeRaised & FE_INVALID)   { res |= FP_EXC_NV_C; }
  if (fpeRaised & FE_DIVBYZERO) { res |= FP_EXC_DZ_C; }
  if (fpeRaised & FE_OVERFLOW)  { res |= FP_EXC_OF_C; }
  if (fpeRaised & FE_UNDERFLOW) { res |= FP_EXC_UF_C; }
  if (fpeRaised & FE_INEXACT)   { res |= FP_EXC_NX_C; }
 
  feclearexcept(FE_ALL_EXCEPT);
 
  return res;
}
 
 
// ################################################################################################
// "Intrinsics"
// ################################################################################################
 
/**********************************************************************//**
 * Single-precision floating-point addition
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fadds(float rs1, float rs2) {

  float_conv_t src_a, src_b, result;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R2_TYPE(0b0000000, src_b.binary_value, src_a.binary_value, 0b000, 0b1010011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point subtraction
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fsubs(float rs1, float rs2) {

  float_conv_t src_a, src_b, result;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R2_TYPE(0b0000100, src_b.binary_value, src_a.binary_value, 0b000, 0b1010011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point multiplication
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fmuls(float rs1, float rs2) {

  float_conv_t src_a, src_b, result;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R2_TYPE(0b0001000, src_b.binary_value, src_a.binary_value, 0b000, 0b1010011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point minimum
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fmins(float rs1, float rs2) {

  float_conv_t src_a, src_b, result;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010100, src_b.binary_value, src_a.binary_value, 0b000, 0b1010011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point maximum
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fmaxs(float rs1, float rs2) {

  float_conv_t src_a, src_b, result;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010100, src_b.binary_value, src_a.binary_value, 0b001, 0b1010011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point convert float to unsigned integer
 *
 * The operand is handed over in its binary representation to the
 * custom-instruction macro; the macro's result is returned unchanged.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fcvt_wus(float rs1) {

  float_conv_t src;

  // re-interpret the float operand as raw 32-bit word
  src.float_value = rs1;

  const uint32_t converted = CUSTOM_INSTR_R1_TYPE(0b1100000, 0b00001, src.binary_value, 0b000, 0b1010011);

  return converted;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point convert float to signed integer
 *
 * The operand is handed over in its binary representation to the
 * custom-instruction macro; the macro's result is cast to a signed integer.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
inline int32_t __attribute__ ((always_inline)) riscv_intrinsic_fcvt_ws(float rs1) {

  float_conv_t src;

  // re-interpret the float operand as raw 32-bit word
  src.float_value = rs1;

  const int32_t converted = (int32_t)CUSTOM_INSTR_R1_TYPE(0b1100000, 0b00000, src.binary_value, 0b000, 0b1010011);

  return converted;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point convert unsigned integer to float
 *
 * The integer operand is passed directly to the custom-instruction macro;
 * the macro's 32-bit result is re-interpreted as float.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fcvt_swu(uint32_t rs1) {

  float_conv_t converted;

  converted.binary_value = CUSTOM_INSTR_R1_TYPE(0b1101000, 0b00001, rs1, 0b000, 0b1010011);

  return converted.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point convert signed integer to float
 *
 * The integer operand is passed directly to the custom-instruction macro;
 * the macro's 32-bit result is re-interpreted as float.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fcvt_sw(int32_t rs1) {

  float_conv_t converted;

  converted.binary_value = CUSTOM_INSTR_R1_TYPE(0b1101000, 0b00000, rs1, 0b000, 0b1010011);

  return converted.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point equal comparison
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; the macro's result is returned unchanged.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_feqs(float rs1, float rs2) {

  float_conv_t src_a, src_b;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  const uint32_t outcome = CUSTOM_INSTR_R2_TYPE(0b1010000, src_b.binary_value, src_a.binary_value, 0b010, 0b1010011);

  return outcome;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point less-than comparison
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; the macro's result is returned unchanged.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_flts(float rs1, float rs2) {

  float_conv_t src_a, src_b;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  const uint32_t outcome = CUSTOM_INSTR_R2_TYPE(0b1010000, src_b.binary_value, src_a.binary_value, 0b001, 0b1010011);

  return outcome;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point less-than-or-equal comparison
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; the macro's result is returned unchanged.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fles(float rs1, float rs2) {

  float_conv_t src_a, src_b;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  const uint32_t outcome = CUSTOM_INSTR_R2_TYPE(0b1010000, src_b.binary_value, src_a.binary_value, 0b000, 0b1010011);

  return outcome;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point sign-injection
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjs(float rs1, float rs2) {

  float_conv_t src_a, src_b, result;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, src_b.binary_value, src_a.binary_value, 0b000, 0b1010011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point sign-injection NOT
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjns(float rs1, float rs2) {

  float_conv_t src_a, src_b, result;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, src_b.binary_value, src_a.binary_value, 0b001, 0b1010011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point sign-injection XOR
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjxs(float rs1, float rs2) {

  float_conv_t src_a, src_b, result;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, src_b.binary_value, src_a.binary_value, 0b010, 0b1010011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point number classification
 *
 * The operand is handed over in its binary representation to the
 * custom-instruction macro; the macro's result is returned unchanged.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fclasss(float rs1) {

  float_conv_t src;

  // re-interpret the float operand as raw 32-bit word
  src.float_value = rs1;

  const uint32_t class_mask = CUSTOM_INSTR_R1_TYPE(0b1110000, 0b00000, src.binary_value, 0b001, 0b1010011);

  return class_mask;
}
 
 
// ################################################################################################
// !!! UNSUPPORTED instructions !!!
// ################################################################################################
 
/**********************************************************************//**
 * Single-precision floating-point division
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fdivs(float rs1, float rs2) {

  float_conv_t src_a, src_b, result;

  // re-interpret the float operands as raw 32-bit words
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R2_TYPE(0b0001100, src_b.binary_value, src_a.binary_value, 0b000, 0b1010011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point square root
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * The operand is handed over in its binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fsqrts(float rs1) {

  float_conv_t src, result;

  // re-interpret the float operand as raw 32-bit word
  src.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R1_TYPE(0b0101100, 0b00000, src.binary_value, 0b000, 0b1010011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused multiply-add
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fmadds(float rs1, float rs2, float rs3) {

  float_conv_t src_a, src_b, src_c, result;

  // re-interpret the float operands as raw 32-bit words
  src_c.float_value = rs3;
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R3_TYPE(src_c.binary_value, src_b.binary_value, src_a.binary_value, 0b000, 0b1000011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused multiply-sub
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fmsubs(float rs1, float rs2, float rs3) {

  float_conv_t src_a, src_b, src_c, result;

  // re-interpret the float operands as raw 32-bit words
  src_c.float_value = rs3;
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R3_TYPE(src_c.binary_value, src_b.binary_value, src_a.binary_value, 0b000, 0b1000111);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused negated multiply-sub
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fnmsubs(float rs1, float rs2, float rs3) {

  float_conv_t src_a, src_b, src_c, result;

  // re-interpret the float operands as raw 32-bit words
  src_c.float_value = rs3;
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R3_TYPE(src_c.binary_value, src_b.binary_value, src_a.binary_value, 0b000, 0b1001011);

  return result.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused negated multiply-add
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * The operands are handed over in their binary representation to the
 * custom-instruction macro; its 32-bit result is returned as float.
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fnmadds(float rs1, float rs2, float rs3) {

  float_conv_t src_a, src_b, src_c, result;

  // re-interpret the float operands as raw 32-bit words
  src_c.float_value = rs3;
  src_b.float_value = rs2;
  src_a.float_value = rs1;

  result.binary_value = CUSTOM_INSTR_R3_TYPE(src_c.binary_value, src_b.binary_value, src_a.binary_value, 0b000, 0b1001111);

  return result.float_value;
}
 
 
// ################################################################################################
// Emulation functions
// ################################################################################################
 
/**********************************************************************//**
 * Single-precision floating-point addition (software emulation)
 *
 * Subnormal operands and a subnormal result are flushed to zero;
 * a NaN result is replaced by the NAN constant.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fadds(float rs1, float rs2) {

  const float lhs = subnormal_flush(rs1);
  const float rhs = subnormal_flush(rs2);

  const float sum = lhs + rhs;

  // any NaN result is reported as the canonical NaN
  const float canonical = (fpclassify(sum) == FP_NAN) ? NAN : sum;

  return subnormal_flush(canonical);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point subtraction (software emulation)
 *
 * Subnormal operands and a subnormal result are flushed to zero;
 * a NaN result is replaced by the NAN constant.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fsubs(float rs1, float rs2) {

  const float lhs = subnormal_flush(rs1);
  const float rhs = subnormal_flush(rs2);

  const float difference = lhs - rhs;

  // any NaN result is reported as the canonical NaN
  const float canonical = (fpclassify(difference) == FP_NAN) ? NAN : difference;

  return subnormal_flush(canonical);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point multiplication (software emulation)
 *
 * Subnormal operands and a subnormal result are flushed to zero.
 * A NaN result is replaced by the NAN constant, exactly as the addition and
 * subtraction emulation functions do (the RISC-V spec requires arithmetic
 * instructions to return the canonical NaN).
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fmuls(float rs1, float rs2) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);

  float res = opa * opb;

  // make NAN canonical
  if (fpclassify(res) == FP_NAN) {
    res = NAN;
  }

  return subnormal_flush(res);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point minimum (software emulation)
 *
 * Subnormal operands are flushed to zero first. If both operands are NaN a
 * NaN is returned; if exactly one operand is NaN the other operand is
 * returned. For a pair of differently signed zeros the result is -0.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fmins(float rs1, float rs2) {

  const float opa = subnormal_flush(rs1);
  const float opb = subnormal_flush(rs2);

  union {
    uint32_t binary_value; /**< Access in binary representation */
    float    float_value;  /**< Access as native float */
  } bits_a, bits_b;

  const int a_is_nan = (fpclassify(opa) == FP_NAN);
  const int b_is_nan = (fpclassify(opb) == FP_NAN);

  // NaN handling: two NaNs give NaN, a single NaN gives the other operand
  if (a_is_nan) {
    return b_is_nan ? nanf("") : opb;
  }
  if (b_is_nan) {
    return opa;
  }

  // RISC-V spec: -0 < +0
  bits_a.float_value = opa;
  bits_b.float_value = opb;
  // OR == sign bit only: both words are zeros and at least one is -0;
  // inequality then rules out the (-0, -0) pair
  if (((bits_a.binary_value | bits_b.binary_value) == 0x80000000) &&
      (bits_a.binary_value != bits_b.binary_value)) {
    return -0.0f;
  }

  return fmin(opa, opb);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point maximum (software emulation)
 *
 * Subnormal operands are flushed to zero first. If both operands are NaN a
 * NaN is returned; if exactly one operand is NaN the other operand is
 * returned. For a pair of differently signed zeros the result is +0.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fmaxs(float rs1, float rs2) {

  const float opa = subnormal_flush(rs1);
  const float opb = subnormal_flush(rs2);

  union {
    uint32_t binary_value; /**< Access in binary representation */
    float    float_value;  /**< Access as native float */
  } bits_a, bits_b;

  const int a_is_nan = (fpclassify(opa) == FP_NAN);
  const int b_is_nan = (fpclassify(opb) == FP_NAN);

  // NaN handling: two NaNs give NaN, a single NaN gives the other operand
  if (a_is_nan) {
    return b_is_nan ? nanf("") : opb;
  }
  if (b_is_nan) {
    return opa;
  }

  // RISC-V spec: -0 < +0
  bits_a.float_value = opa;
  bits_b.float_value = opb;
  // OR == sign bit only: both words are zeros and at least one is -0;
  // inequality then rules out the (-0, -0) pair
  if (((bits_a.binary_value | bits_b.binary_value) == 0x80000000) &&
      (bits_a.binary_value != bits_b.binary_value)) {
    return +0.0f;
  }

  return fmax(opa, opb);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point float to unsigned integer (software emulation)
 *
 * The operand is rounded with rintf(), i.e. according to the current rounding
 * mode (round to nearest, ties to even by default), instead of roundf(), which
 * always rounds ties away from zero. Values that cannot be represented are
 * saturated as defined by the RISC-V spec for FCVT.WU.S rather than being
 * cast directly (an out-of-range float-to-integer cast is undefined in C):
 * NaN and values above the range give 0xFFFFFFFF, negative values give 0.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
uint32_t __attribute__ ((noinline)) riscv_emulate_fcvt_wus(float rs1) {

  float opa = subnormal_flush(rs1);

  // NaN converts to the largest unsigned value
  if (fpclassify(opa) == FP_NAN) {
    return 0xFFFFFFFFu;
  }

  float rounded = rintf(opa);

  // zero and everything negative (including -infinity) saturates to 0
  if (rounded <= 0.0f) {
    return 0;
  }

  // 2^32 and above (including +infinity) saturates to the largest value
  if (rounded >= 4294967296.0f) {
    return 0xFFFFFFFFu;
  }

  return (uint32_t)rounded;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point float to signed integer (software emulation)
 *
 * The operand is rounded with rintf(), i.e. according to the current rounding
 * mode (round to nearest, ties to even by default), instead of roundf(), which
 * always rounds ties away from zero. Values that cannot be represented are
 * saturated as defined by the RISC-V spec for FCVT.W.S rather than being
 * cast directly (an out-of-range float-to-integer cast is undefined in C):
 * NaN and values above the range give 2^31-1, values below the range give -2^31.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
int32_t __attribute__ ((noinline)) riscv_emulate_fcvt_ws(float rs1) {

  float opa = subnormal_flush(rs1);

  // NaN converts to the largest positive value
  if (fpclassify(opa) == FP_NAN) {
    return 2147483647;
  }

  float rounded = rintf(opa);

  // 2^31 and above (including +infinity) saturates to the largest value
  if (rounded >= 2147483648.0f) {
    return 2147483647;
  }

  // below -2^31 (including -infinity) saturates to the smallest value;
  // -2^31 itself is representable and converted normally
  if (rounded < -2147483648.0f) {
    return (-2147483647 - 1);
  }

  return (int32_t)rounded;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point unsigned integer to float (software emulation)
 *
 * Plain C conversion of the integer operand to float.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fcvt_swu(uint32_t rs1) {

  const float converted = (float)rs1;

  return converted;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point signed integer to float (software emulation)
 *
 * Plain C conversion of the integer operand to float.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fcvt_sw(int32_t rs1) {

  const float converted = (float)rs1;

  return converted;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point equal comparison (software emulation)
 *
 * Subnormal operands are flushed to zero first. The comparison is false if
 * either operand is NaN.
 *
 * @note The conditions are explicitly parenthesized: "if isless(...)" only
 * compiles when the C library's macro happens to expand to a parenthesized
 * expression, which is not guaranteed.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return 1 if the operands compare equal, 0 otherwise.
 **************************************************************************/
uint32_t __attribute__ ((noinline)) riscv_emulate_feqs(float rs1, float rs2) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);

  if ((fpclassify(opa) == FP_NAN) || (fpclassify(opb) == FP_NAN)) {
    return 0;
  }

  // neither less nor greater (and not unordered, see above) means equal
  if (isless(opa, opb) || isgreater(opa, opb)) {
    return 0;
  }

  return 1;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point less-than comparison (software emulation)
 *
 * Subnormal operands are flushed to zero first. The comparison is false if
 * either operand is NaN.
 *
 * @note The condition is explicitly parenthesized: "if isless(...)" only
 * compiles when the C library's macro happens to expand to a parenthesized
 * expression, which is not guaranteed.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return 1 if rs1 is less than rs2, 0 otherwise.
 **************************************************************************/
uint32_t __attribute__ ((noinline)) riscv_emulate_flts(float rs1, float rs2) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);

  if ((fpclassify(opa) == FP_NAN) || (fpclassify(opb) == FP_NAN)) {
    return 0;
  }

  if (isless(opa, opb)) {
    return 1;
  }

  return 0;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point less-than-or-equal comparison (software emulation)
 *
 * Subnormal operands are flushed to zero first. The comparison is false if
 * either operand is NaN.
 *
 * @note The condition is explicitly parenthesized: "if islessequal(...)" only
 * compiles when the C library's macro happens to expand to a parenthesized
 * expression, which is not guaranteed.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return 1 if rs1 is less than or equal to rs2, 0 otherwise.
 **************************************************************************/
uint32_t __attribute__ ((noinline)) riscv_emulate_fles(float rs1, float rs2) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);

  if ((fpclassify(opa) == FP_NAN) || (fpclassify(opb) == FP_NAN)) {
    return 0;
  }

  if (islessequal(opa, opb)) {
    return 1;
  }

  return 0;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point sign-injection (software emulation)
 *
 * Returns operand 1 (after subnormal flushing) carrying the sign of operand 2.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fsgnjs(float rs1, float rs2) {

  const float opa = subnormal_flush(rs1);
  const float opb = subnormal_flush(rs2);

  const int a_negative = (signbit(opa) != 0);
  const int b_negative = (signbit(opb) != 0);

  // operand 1 already has the requested sign if both signs agree; flip it otherwise
  return (a_negative == b_negative) ? opa : -opa;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point sign-injection NOT (software emulation)
 *
 * Returns operand 1 (after subnormal flushing) carrying the inverted sign of operand 2.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fsgnjns(float rs1, float rs2) {

  const float opa = subnormal_flush(rs1);
  const float opb = subnormal_flush(rs2);

  const int a_negative = (signbit(opa) != 0);
  const int b_negative = (signbit(opb) != 0);

  // operand 1 already has the requested (opposite) sign if the signs differ; flip it otherwise
  return (a_negative != b_negative) ? opa : -opa;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point sign-injection XOR (software emulation)
 *
 * Returns operand 1 (after subnormal flushing) whose sign is the XOR of both operands' signs.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fsgnjxs(float rs1, float rs2) {

  const float opa = subnormal_flush(rs1);
  const float opb = subnormal_flush(rs2);

  const int b_negative = (signbit(opb) != 0);

  // XOR-ing with a set sign bit flips operand 1's sign, a clear sign bit leaves it alone
  return b_negative ? -opa : opa;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point number classification
 *
 * The operand is passed through subnormal_flush() first and is then mapped
 * to the RISC-V classify mask (one bit per class).
 *
 * @param[in] rs1 Source operand 1.
 * @return Result (classification mask; 0 if fpclassify() reports none of the five standard categories).
 **************************************************************************/
uint32_t __attribute__ ((noinline)) riscv_emulate_fclasss(float rs1) {

  // RISC-V classify result layout
  enum {
    CLASS_NEG_INF    = 1 << 0, // negative infinity
    CLASS_NEG_NORM   = 1 << 1, // negative normal number
    CLASS_NEG_DENORM = 1 << 2, // negative subnormal number
    CLASS_NEG_ZERO   = 1 << 3, // negative zero
    CLASS_POS_ZERO   = 1 << 4, // positive zero
    CLASS_POS_DENORM = 1 << 5, // positive subnormal number
    CLASS_POS_NORM   = 1 << 6, // positive normal number
    CLASS_POS_INF    = 1 << 7, // positive infinity
    CLASS_SNAN       = 1 << 8, // signaling NaN (sNaN)
    CLASS_QNAN       = 1 << 9  // quiet NaN (qNaN)
  };

  const float value = subnormal_flush(rs1);
  const int is_negative = (signbit(value) != 0);

  uint32_t mask = 0;

  switch (fpclassify(value)) {

    case FP_INFINITE:
      mask = is_negative ? CLASS_NEG_INF : CLASS_POS_INF;
      break;

    case FP_ZERO:
      mask = is_negative ? CLASS_NEG_ZERO : CLASS_POS_ZERO;
      break;

    case FP_NORMAL:
      mask = is_negative ? CLASS_NEG_NORM : CLASS_POS_NORM;
      break;

    case FP_SUBNORMAL:
      // NOTE(review): subnormal_flush() is expected to have removed subnormals
      // already, so this case is presumably never taken - kept for completeness
      mask = is_negative ? CLASS_NEG_DENORM : CLASS_POS_DENORM;
      break;

    case FP_NAN: {
      // look at the raw encoding to tell quiet from signaling NaNs
      union {
        uint32_t bits;   /**< Access in binary representation */
        float    number; /**< Access as native float */
      } raw;
      raw.number = value;
      // bit 22 (mantissa's MSB) set -> quiet NaN, cleared -> signaling NaN
      mask = ((raw.bits & (1u << 22)) != 0) ? CLASS_QNAN : CLASS_SNAN;
      break;
    }

    default: // any other category: no class bit is set
      break;
  }

  return mask;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point division
 *
 * Computes rs1 / rs2. Both operands and the quotient are passed through
 * subnormal_flush().
 *
 * @param[in] rs1 Source operand 1 (dividend).
 * @param[in] rs2 Source operand 2 (divisor).
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fdivs(float rs1, float rs2) {

  const float dividend = subnormal_flush(rs1);
  const float divisor  = subnormal_flush(rs2);

  // the quotient is flushed as well before it is handed back
  const float quotient = dividend / divisor;

  return subnormal_flush(quotient);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point square root
 *
 * Computes sqrtf(rs1). The operand and the root are both passed through
 * subnormal_flush().
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fsqrts(float rs1) {

  const float radicand = subnormal_flush(rs1);

  // the root is flushed as well before it is handed back
  const float root = sqrtf(radicand);

  return subnormal_flush(root);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused multiply-add
 *
 * Computes (rs1 * rs2) + rs3 with a single rounding step. All operands and
 * the result are passed through subnormal_flush().
 *
 * @warning The corresponding hardware instruction is not supported!
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fmadds(float rs1, float rs2, float rs3) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);
  float opc = subnormal_flush(rs3);

  // fmaf() rounds only once, after the addition; a plain "(opa * opb) + opc"
  // rounds the product first and is therefore not a fused operation
  float res = fmaf(opa, opb, opc);
  return subnormal_flush(res);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused multiply-sub
 *
 * Computes (rs1 * rs2) - rs3 with a single rounding step. All operands and
 * the result are passed through subnormal_flush().
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fmsubs(float rs1, float rs2, float rs3) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);
  float opc = subnormal_flush(rs3);

  // fmaf() rounds only once, after the subtraction; a plain "(opa * opb) - opc"
  // rounds the product first and is therefore not a fused operation
  float res = fmaf(opa, opb, -opc);
  return subnormal_flush(res);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused negated multiply-sub
 *
 * Computes -(rs1 * rs2) + rs3 with a single rounding step. All operands and
 * the result are passed through subnormal_flush().
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fnmsubs(float rs1, float rs2, float rs3) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);
  float opc = subnormal_flush(rs3);

  // negating one factor negates the exact product, so fmaf(-a, b, c) yields
  // -(a * b) + c with a single rounding; "-(opa * opb) + opc" would round twice
  float res = fmaf(-opa, opb, opc);
  return subnormal_flush(res);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused negated multiply-add
 *
 * Computes -(rs1 * rs2) - rs3 with a single rounding step. All operands and
 * the result are passed through subnormal_flush().
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fnmadds(float rs1, float rs2, float rs3) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);
  float opc = subnormal_flush(rs3);

  // fmaf(-a, b, -c) yields -(a * b) - c with a single rounding; negating the
  // inputs (instead of the fmaf() result) keeps the sign of an exact zero sum
  // identical to that of the written-out expression
  float res = fmaf(-opa, opb, -opc);
  return subnormal_flush(res);
}
 
 
#endif // neorv32_zfinx_extension_intrinsics_h
 

Line No.	Rev	Author	Line
1	55	zero_gravi	`// #################################################################################################`
2			`// # << NEORV32 - Intrinsics + Emulation Functions for the RISC-V "Zfinx" CPU extension >> #`
3			`// # ********************************************************************************************* #`
4			`// # The intrinsics provided by this library allow to use the hardware floating-point unit of the #`
5			`// # RISC-V Zfinx CPU extension without the need for Zfinx support by the compiler / toolchain. #`
6			`// # ********************************************************************************************* #`
7			`// # BSD 3-Clause License #`
8			`// # #`
9	71	zero_gravi	`// # Copyright (c) 2022, Stephan Nolting. All rights reserved. #`
10	55	zero_gravi	`// # #`
11			`// # Redistribution and use in source and binary forms, with or without modification, are #`
12			`// # permitted provided that the following conditions are met: #`
13			`// # #`
14			`// # 1. Redistributions of source code must retain the above copyright notice, this list of #`
15			`// # conditions and the following disclaimer. #`
16			`// # #`
17			`// # 2. Redistributions in binary form must reproduce the above copyright notice, this list of #`
18			`// # conditions and the following disclaimer in the documentation and/or other materials #`
19			`// # provided with the distribution. #`
20			`// # #`
21			`// # 3. Neither the name of the copyright holder nor the names of its contributors may be used to #`
22			`// # endorse or promote products derived from this software without specific prior written #`
23			`// # permission. #`
24			`// # #`
25			`// # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS #`
26			`// # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF #`
27			`// # MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE #`
28			`// # COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, #`
29			`// # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE #`
30			`// # GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED #`
31			`// # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING #`
32			`// # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED #`
33			`// # OF THE POSSIBILITY OF SUCH DAMAGE. #`
34			`// # ********************************************************************************************* #`
35			`// # The NEORV32 Processor - https://github.com/stnolting/neorv32 (c) Stephan Nolting #`
36			`// #################################################################################################`
37
38
39			`/********************************************************************//`
40			`* @file floating_point_test/neorv32_zfinx_extension_intrinsics.h`
41			`* @author Stephan Nolting`
42			`*`
43			`* @brief "Intrinsic" library for the NEORV32 single-precision floating-point in x registers (Zfinx) extension`
44			`* @brief Also provides emulation functions for all intrinsics (functionality re-built in pure software). The functionality of the emulation`
45			`* @brief functions is based on the RISC-V floating-point spec.`
46			`*`
47			`* @note All operations from this library use the default GCC "round to nearest, ties to even" rounding mode.`
48			`*`
49			`* @warning This library is just a temporary fall-back until the Zfinx extensions are supported by the upstream RISC-V GCC port.`
50			`**************************************************************************/`
51
52			`#ifndef neorv32_zfinx_extension_intrinsics_h`
53			`#define neorv32_zfinx_extension_intrinsics_h`
54
55			`#define __USE_GNU`
56
57			`#include <fenv.h>`
58			`//#pragma STDC FENV_ACCESS ON`
59
60			`#define _GNU_SOURCE`
61
62			`#include <float.h>`
63			`#include <math.h>`
64
65
66			`/********************************************************************//`
67			`* Sanity check`
68			`**************************************************************************/`
69			`#if defined __riscv_f \|\| (__riscv_flen == 32)`
70			`#error Application programs using the Zfinx intrinsic library have to be compiled WITHOUT the <F> MARCH ISA attribute!`
71			`#endif`
72
73
74			`/********************************************************************//`
75			`* Custom data type to access floating-point values as native floats and in binary representation`
76			`**************************************************************************/`
77			`typedef union`
78			`{`
79			`uint32_t binary_value; /**< Access in binary representation */`
80			`float float_value; /**< Access as native float */`
81			`} float_conv_t;`
82
83
84			`// ################################################################################################`
85			`// Helper functions`
86			`// ################################################################################################`
87
88			`/********************************************************************//`
89	74	zero_gravi	`* Flush to zero if de-normal number.`
90	55	zero_gravi	`*`
91			`* @warning Subnormal numbers are not supported yet! Flush them to zero.`
92			`*`
93	56	zero_gravi	`* @param[in] tmp Source operand.`
94	55	zero_gravi	`* @return Result.`
95			`**************************************************************************/`
96			`float subnormal_flush(float tmp) {`
97
98			`float res = tmp;`
99
100	74	zero_gravi	`// flush to zero if subnormal`
101	55	zero_gravi	`if (fpclassify(tmp) == FP_SUBNORMAL) {`
102			`if (signbit(tmp) != 0) {`
103			`res = -0.0f;`
104			`}`
105			`else {`
106			`res = +0.0f;`
107			`}`
108			`}`
109
110			`return res;`
111			`}`
112
113
114			`// ################################################################################################`
115			`// Exception access`
116			`// ################################################################################################`
117
118			`/********************************************************************//`
119			`* Get exception flags from fflags CSR (floating-point hardware).`
120			`*`
121			`* @return Floating point exception status word.`
122			`**************************************************************************/`
123			`uint32_t get_hw_exceptions(void) {`
124
125			`uint32_t res = neorv32_cpu_csr_read(CSR_FFLAGS);`
126
127			`neorv32_cpu_csr_write(CSR_FFLAGS, 0); // clear status word`
128
129			`return res;`
130			`}`
131
132
133			`/********************************************************************//`
134			`* Get exception flags from C runtime (floating-point emulation).`
135			`*`
136			`* @warning WORK-IN-PROGRESS!`
137			`*`
138			`* @return Floating point exception status word.`
139			`**************************************************************************/`
140			`uint32_t get_sw_exceptions(void) {`
141
142			`const uint32_t FP_EXC_NV_C = 1 << 0; // invalid operation`
143			`const uint32_t FP_EXC_DZ_C = 1 << 1; // divide by zero`
144			`const uint32_t FP_EXC_OF_C = 1 << 2; // overflow`
145			`const uint32_t FP_EXC_UF_C = 1 << 3; // underflow`
146			`const uint32_t FP_EXC_NX_C = 1 << 4; // inexact`
147
148			`int fpeRaised = fetestexcept(FE_ALL_EXCEPT);`
149
150			`uint32_t res = 0;`
151
152			`if (fpeRaised & FE_INVALID) { res \|= FP_EXC_NV_C; }`
153			`if (fpeRaised & FE_DIVBYZERO) { res \|= FP_EXC_DZ_C; }`
154			`if (fpeRaised & FE_OVERFLOW) { res \|= FP_EXC_OF_C; }`
155			`if (fpeRaised & FE_UNDERFLOW) { res \|= FP_EXC_UF_C; }`
156			`if (fpeRaised & FE_INEXACT) { res \|= FP_EXC_NX_C; }`
157
158			`feclearexcept(FE_ALL_EXCEPT);`
159
160			`return res;`
161			`}`
162
163
164			`// ################################################################################################`
165			`// "Intrinsics"`
166			`// ################################################################################################`
167
168			`/********************************************************************//`
169			`* Single-precision floating-point addition`
170			`*`
171	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
172			`* @param[in] rs2 Source operand 2.`
173	55	zero_gravi	`* @return Result.`
174			`**************************************************************************/`
175	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fadds(float rs1, float rs2) {`
176	55	zero_gravi
177			`float_conv_t opa, opb, res;`
178			`opa.float_value = rs1;`
179			`opb.float_value = rs2;`
180
181	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0000000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
182	55	zero_gravi	`return res.float_value;`
183			`}`
184
185
186			`/********************************************************************//`
187			`* Single-precision floating-point subtraction`
188			`*`
189	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
190			`* @param[in] rs2 Source operand 2.`
191	55	zero_gravi	`* @return Result.`
192			`**************************************************************************/`
193	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fsubs(float rs1, float rs2) {`
194	55	zero_gravi
195			`float_conv_t opa, opb, res;`
196			`opa.float_value = rs1;`
197			`opb.float_value = rs2;`
198
199	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0000100, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
200	55	zero_gravi	`return res.float_value;`
201			`}`
202
203
204			`/********************************************************************//`
205			`* Single-precision floating-point multiplication`
206			`*`
207	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
208			`* @param[in] rs2 Source operand 2.`
209	55	zero_gravi	`* @return Result.`
210			`**************************************************************************/`
211	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fmuls(float rs1, float rs2) {`
212	55	zero_gravi
213			`float_conv_t opa, opb, res;`
214			`opa.float_value = rs1;`
215			`opb.float_value = rs2;`
216
217	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0001000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
218	55	zero_gravi	`return res.float_value;`
219			`}`
220
221
222			`/********************************************************************//`
223			`* Single-precision floating-point minimum`
224			`*`
225	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
226			`* @param[in] rs2 Source operand 2.`
227	55	zero_gravi	`* @return Result.`
228			`**************************************************************************/`
229	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fmins(float rs1, float rs2) {`
230	55	zero_gravi
231			`float_conv_t opa, opb, res;`
232			`opa.float_value = rs1;`
233			`opb.float_value = rs2;`
234
235	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010100, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
236	55	zero_gravi	`return res.float_value;`
237			`}`
238
239
240			`/********************************************************************//`
241			`* Single-precision floating-point maximum`
242			`*`
243	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
244			`* @param[in] rs2 Source operand 2.`
245	55	zero_gravi	`* @return Result.`
246			`**************************************************************************/`
247	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fmaxs(float rs1, float rs2) {`
248	55	zero_gravi
249			`float_conv_t opa, opb, res;`
250			`opa.float_value = rs1;`
251			`opb.float_value = rs2;`
252
253	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010100, opb.binary_value, opa.binary_value, 0b001, 0b1010011);`
254	55	zero_gravi	`return res.float_value;`
255			`}`
256
257
258			`/********************************************************************//`
259			`* Single-precision floating-point convert float to unsigned integer`
260			`*`
261	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
262	55	zero_gravi	`* @return Result.`
263			`**************************************************************************/`
264	56	zero_gravi	`inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fcvt_wus(float rs1) {`
265	55	zero_gravi
266			`float_conv_t opa;`
267			`opa.float_value = rs1;`
268
269	71	zero_gravi	`return CUSTOM_INSTR_R1_TYPE(0b1100000, 0b00001, opa.binary_value, 0b000, 0b1010011);`
270	55	zero_gravi	`}`
271
272
273			`/********************************************************************//`
274			`* Single-precision floating-point convert float to signed integer`
275			`*`
276	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
277	55	zero_gravi	`* @return Result.`
278			`**************************************************************************/`
279	56	zero_gravi	`inline int32_t __attribute__ ((always_inline)) riscv_intrinsic_fcvt_ws(float rs1) {`
280	55	zero_gravi
281			`float_conv_t opa;`
282			`opa.float_value = rs1;`
283
284	71	zero_gravi	`return (int32_t)CUSTOM_INSTR_R1_TYPE(0b1100000, 0b00000, opa.binary_value, 0b000, 0b1010011);`
285	55	zero_gravi	`}`
286
287
288			`/********************************************************************//`
289			`* Single-precision floating-point convert unsigned integer to float`
290			`*`
291	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
292	55	zero_gravi	`* @return Result.`
293			`**************************************************************************/`
294	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fcvt_swu(uint32_t rs1) {`
295	55	zero_gravi
296			`float_conv_t res;`
297
298	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R1_TYPE(0b1101000, 0b00001, rs1, 0b000, 0b1010011);`
299	55	zero_gravi	`return res.float_value;`
300			`}`
301
302
303			`/********************************************************************//`
304			`* Single-precision floating-point convert signed integer to float`
305			`*`
306	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
307	55	zero_gravi	`* @return Result.`
308			`**************************************************************************/`
309	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fcvt_sw(int32_t rs1) {`
310	55	zero_gravi
311			`float_conv_t res;`
312
313	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R1_TYPE(0b1101000, 0b00000, rs1, 0b000, 0b1010011);`
314	55	zero_gravi	`return res.float_value;`
315			`}`
316
317
318			`/********************************************************************//`
319			`* Single-precision floating-point equal comparison`
320			`*`
321	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
322			`* @param[in] rs2 Source operand 2.`
323	55	zero_gravi	`* @return Result.`
324			`**************************************************************************/`
325	56	zero_gravi	`inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_feqs(float rs1, float rs2) {`
326	55	zero_gravi
327			`float_conv_t opa, opb;`
328			`opa.float_value = rs1;`
329			`opb.float_value = rs2;`
330
331	71	zero_gravi	`return CUSTOM_INSTR_R2_TYPE(0b1010000, opb.binary_value, opa.binary_value, 0b010, 0b1010011);`
332	55	zero_gravi	`}`
333
334
335			`/********************************************************************//`
336			`* Single-precision floating-point less-than comparison`
337			`*`
338	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
339			`* @param[in] rs2 Source operand 2.`
340	55	zero_gravi	`* @return Result.`
341			`**************************************************************************/`
342	56	zero_gravi	`inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_flts(float rs1, float rs2) {`
343	55	zero_gravi
344			`float_conv_t opa, opb;`
345			`opa.float_value = rs1;`
346			`opb.float_value = rs2;`
347
348	71	zero_gravi	`return CUSTOM_INSTR_R2_TYPE(0b1010000, opb.binary_value, opa.binary_value, 0b001, 0b1010011);`
349	55	zero_gravi	`}`
350
351
352			`/********************************************************************//`
353			`* Single-precision floating-point less-than-or-equal comparison`
354			`*`
355	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
356			`* @param[in] rs2 Source operand 2.`
357	55	zero_gravi	`* @return Result.`
358			`**************************************************************************/`
359	56	zero_gravi	`inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fles(float rs1, float rs2) {`
360	55	zero_gravi
361			`float_conv_t opa, opb;`
362			`opa.float_value = rs1;`
363			`opb.float_value = rs2;`
364
365	71	zero_gravi	`return CUSTOM_INSTR_R2_TYPE(0b1010000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
366	55	zero_gravi	`}`
367
368
369			`/********************************************************************//`
370			`* Single-precision floating-point sign-injection`
371			`*`
372	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
373			`* @param[in] rs2 Source operand 2.`
374	55	zero_gravi	`* @return Result.`
375			`**************************************************************************/`
376	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjs(float rs1, float rs2) {`
377	55	zero_gravi
378			`float_conv_t opa, opb, res;`
379			`opa.float_value = rs1;`
380			`opb.float_value = rs2;`
381
382	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
383	55	zero_gravi	`return res.float_value;`
384			`}`
385
386
387			`/********************************************************************//`
388			`* Single-precision floating-point sign-injection NOT`
389			`*`
390	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
391			`* @param[in] rs2 Source operand 2.`
392	55	zero_gravi	`* @return Result.`
393			`**************************************************************************/`
394	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjns(float rs1, float rs2) {`
395	55	zero_gravi
396			`float_conv_t opa, opb, res;`
397			`opa.float_value = rs1;`
398			`opb.float_value = rs2;`
399
400	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, opb.binary_value, opa.binary_value, 0b001, 0b1010011);`
401	55	zero_gravi	`return res.float_value;`
402			`}`
403
404
405			`/********************************************************************//`
406			`* Single-precision floating-point sign-injection XOR`
407			`*`
408	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
409			`* @param[in] rs2 Source operand 2.`
410	55	zero_gravi	`* @return Result.`
411			`**************************************************************************/`
412	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjxs(float rs1, float rs2) {`
413	55	zero_gravi
414			`float_conv_t opa, opb, res;`
415			`opa.float_value = rs1;`
416			`opb.float_value = rs2;`
417
418	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, opb.binary_value, opa.binary_value, 0b010, 0b1010011);`
419	55	zero_gravi	`return res.float_value;`
420			`}`
421
422
423			`/********************************************************************//`
424			`* Single-precision floating-point number classification`
425			`*`
426	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
427	55	zero_gravi	`* @return Result.`
428			`**************************************************************************/`
429	56	zero_gravi	`inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fclasss(float rs1) {`
430	55	zero_gravi
431			`float_conv_t opa;`
432			`opa.float_value = rs1;`
433
434	71	zero_gravi	`return CUSTOM_INSTR_R1_TYPE(0b1110000, 0b00000, opa.binary_value, 0b001, 0b1010011);`
435	55	zero_gravi	`}`
436
437
438			`// ################################################################################################`
439			`// !!! UNSUPPORTED instructions !!!`
440			`// ################################################################################################`
441
442			`/********************************************************************//`
443			`* Single-precision floating-point division`
444			`*`
445			`* @warning This instruction is not supported and should raise an illegal instruction exception when executed.`
446			`*`
447	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
448			`* @param[in] rs2 Source operand 2.`
449	55	zero_gravi	`* @return Result.`
450			`**************************************************************************/`
451	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fdivs(float rs1, float rs2) {`
452	55	zero_gravi
453			`float_conv_t opa, opb, res;`
454			`opa.float_value = rs1;`
455			`opb.float_value = rs2;`
456
457	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0001100, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
458	55	zero_gravi	`return res.float_value;`
459			`}`
460
461
462			`/********************************************************************//`
463			`* Single-precision floating-point square root`
464			`*`
465			`* @warning This instruction is not supported and should raise an illegal instruction exception when executed.`
466			`*`
467	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
468	55	zero_gravi	`* @return Result.`
469			`**************************************************************************/`
470	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fsqrts(float rs1) {`
471	55	zero_gravi
472			`float_conv_t opa, res;`
473			`opa.float_value = rs1;`
474
475	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R1_TYPE(0b0101100, 0b00000, opa.binary_value, 0b000, 0b1010011);`
476	55	zero_gravi	`return res.float_value;`
477			`}`
478
479
480			`/********************************************************************//`
481			`* Single-precision floating-point fused multiply-add`
482			`*`
483			`* @warning This instruction is not supported and should raise an illegal instruction exception when executed.`
484			`*`
485	71	zero_gravi	`* @param[in] rs1 Source operand 1`
486			`* @param[in] rs2 Source operand 2`
487			`* @param[in] rs3 Source operand 3`
488	55	zero_gravi	`* @return Result.`
489			`**************************************************************************/`
490	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fmadds(float rs1, float rs2, float rs3) {`
491	55	zero_gravi
492			`float_conv_t opa, opb, opc, res;`
493			`opa.float_value = rs1;`
494			`opb.float_value = rs2;`
495			`opc.float_value = rs3;`
496
497	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R3_TYPE(opc.binary_value, opb.binary_value, opa.binary_value, 0b000, 0b1000011);`
498	55	zero_gravi	`return res.float_value;`
499			`}`
500

Browse

Tools

Subversion Repositories neorv32

[/] [neorv32/] [trunk/] [sw/] [example/] [floating_point_test/] [neorv32_zfinx_extension_intrinsics.h] - Blame information for rev 74