URL https://opencores.org/ocsvn/neorv32/neorv32/trunk

Subversion Repositories neorv32

[/] [neorv32/] [trunk/] [sw/] [example/] [floating_point_test/] [neorv32_zfinx_extension_intrinsics.h] - Blame information for rev 71

Go to most recent revision | Details | Compare with Previous | View Log


// #################################################################################################
// # << NEORV32 - Intrinsics + Emulation Functions for the RISC-V "Zfinx" CPU extension >>         #
// # ********************************************************************************************* #
// # The intrinsics provided by this library allow to use the hardware floating-point unit of the  #
// # RISC-V Zfinx CPU extension without the need for Zfinx support by the compiler / toolchain.    #
// # ********************************************************************************************* #
// # BSD 3-Clause License                                                                          #
// #                                                                                               #
// # Copyright (c) 2022, Stephan Nolting. All rights reserved.                                     #
// #                                                                                               #
// # Redistribution and use in source and binary forms, with or without modification, are          #
// # permitted provided that the following conditions are met:                                     #
// #                                                                                               #
// # 1. Redistributions of source code must retain the above copyright notice, this list of        #
// #    conditions and the following disclaimer.                                                   #
// #                                                                                               #
// # 2. Redistributions in binary form must reproduce the above copyright notice, this list of     #
// #    conditions and the following disclaimer in the documentation and/or other materials        #
// #    provided with the distribution.                                                            #
// #                                                                                               #
// # 3. Neither the name of the copyright holder nor the names of its contributors may be used to  #
// #    endorse or promote products derived from this software without specific prior written      #
// #    permission.                                                                                #
// #                                                                                               #
// # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS   #
// # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF               #
// # MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE    #
// # COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,     #
// # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE #
// # GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED    #
// # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING     #
// # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED  #
// # OF THE POSSIBILITY OF SUCH DAMAGE.                                                            #
// # ********************************************************************************************* #
// # The NEORV32 Processor - https://github.com/stnolting/neorv32              (c) Stephan Nolting #
// #################################################################################################
 
 
/**********************************************************************//**
 * @file floating_point_test/neorv32_zfinx_extension_intrinsics.h
 * @author Stephan Nolting
 *
 * @brief "Intrinsic" library for the NEORV32 single-precision floating-point in x registers (Zfinx) extension
 * @brief Also provides emulation functions for all intrinsics (functionality re-built in pure software). The functionality of the emulation
 * @brief functions is based on the RISC-V floating-point spec.
 *
 * @note All operations from this library use the default GCC "round to nearest, ties to even" rounding mode.
 *
 * @warning This library is just a temporary fall-back until the Zfinx extensions are supported by the upstream RISC-V GCC port.
 **************************************************************************/
 
#ifndef neorv32_zfinx_extension_intrinsics_h
#define neorv32_zfinx_extension_intrinsics_h
 
#define __USE_GNU
 
#include <fenv.h>
//#pragma STDC FENV_ACCESS ON
 
#define _GNU_SOURCE
 
#include <float.h>
#include <math.h>
 
 
/**********************************************************************//**
 * Sanity check: stop the build when the compiler reports single-precision
 * floating-point support of its own (__riscv_f is defined or __riscv_flen
 * equals 32). This library must be built without the F ISA attribute.
 **************************************************************************/
#if defined __riscv_f || (__riscv_flen == 32)
  #error Application programs using the Zfinx intrinsic library have to be compiled WITHOUT the <F> MARCH ISA attribute!
#endif
 
 
/**********************************************************************//**
 * Custom data type to access floating-point values as native floats and in binary representation.
 * Both members share the same storage, so writing one and reading the other
 * reinterprets the 32-bit pattern.
 **************************************************************************/
typedef union
{
  uint32_t binary_value; /**< Access in binary representation */
  float    float_value;  /**< Access as native float */
} float_conv_t;
 
 
// ################################################################################################
// Helper functions
// ################################################################################################
 
/**********************************************************************//**
 * Replace a subnormal (denormal) number by a zero of the same sign.
 *
 * @warning Subnormal numbers are not supported yet, hence they are flushed to zero.
 *
 * @param[in] tmp Value to check.
 * @return Signed zero if tmp is subnormal, otherwise tmp unchanged.
 **************************************************************************/
float subnormal_flush(float tmp) {

  // everything that is not subnormal passes through untouched
  if (fpclassify(tmp) != FP_SUBNORMAL) {
    return tmp;
  }

  // keep the sign of the flushed value
  return signbit(tmp) ? -0.0f : +0.0f;
}
 
 
// ################################################################################################
// Exception access
// ################################################################################################
 
/**********************************************************************//**
 * Fetch the exception flags of the floating-point hardware (fflags CSR).
 * The CSR is cleared afterwards.
 *
 * @return Floating point exception status word as read from the CSR.
 **************************************************************************/
uint32_t get_hw_exceptions(void) {

  // grab the flags first, then reset the CSR for the next query
  const uint32_t flags = neorv32_cpu_csr_read(CSR_FFLAGS);
  neorv32_cpu_csr_write(CSR_FFLAGS, 0);

  return flags;
}
 
 
/**********************************************************************//**
 * Fetch the exception flags of the C runtime (floating-point emulation) and
 * translate them into a status word. All runtime flags are cleared afterwards.
 *
 * @warning WORK-IN-PROGRESS!
 *
 * @note NOTE(review): the bit positions used here (NV = bit 0 ... NX = bit 4) are the
 * reverse of the fflags layout in the RISC-V "F" specification (NX = bit 0 ... NV = bit 4).
 * Confirm that this matches what get_hw_exceptions() delivers on the target.
 *
 * @return Floating point exception status word.
 **************************************************************************/
uint32_t get_sw_exceptions(void) {

  // bit positions of the returned status word
  enum {
    NV_BIT = 1 << 0, // invalid operation
    DZ_BIT = 1 << 1, // divide by zero
    OF_BIT = 1 << 2, // overflow
    UF_BIT = 1 << 3, // underflow
    NX_BIT = 1 << 4  // inexact
  };

  const int raised = fetestexcept(FE_ALL_EXCEPT);

  uint32_t flags = 0;
  flags |= (raised & FE_INVALID)   ? NV_BIT : 0;
  flags |= (raised & FE_DIVBYZERO) ? DZ_BIT : 0;
  flags |= (raised & FE_OVERFLOW)  ? OF_BIT : 0;
  flags |= (raised & FE_UNDERFLOW) ? UF_BIT : 0;
  flags |= (raised & FE_INEXACT)   ? NX_BIT : 0;

  // start with a clean slate for the next query
  feclearexcept(FE_ALL_EXCEPT);

  return flags;
}
 
 
// ################################################################################################
// "Intrinsics"
// ################################################################################################
 
/**********************************************************************//**
 * Single-precision floating-point addition
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fadds(float rs1, float rs2) {
 
  float_conv_t opa, opb, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
 
  res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0000000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point subtraction
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fsubs(float rs1, float rs2) {
 
  float_conv_t opa, opb, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
 
  res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0000100, opb.binary_value, opa.binary_value, 0b000, 0b1010011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point multiplication
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fmuls(float rs1, float rs2) {
 
  float_conv_t opa, opb, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
 
  res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0001000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point minimum
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fmins(float rs1, float rs2) {
 
  float_conv_t opa, opb, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
 
  res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010100, opb.binary_value, opa.binary_value, 0b000, 0b1010011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point maximum
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fmaxs(float rs1, float rs2) {
 
  float_conv_t opa, opb, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
 
  res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010100, opb.binary_value, opa.binary_value, 0b001, 0b1010011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Zfinx intrinsic: convert single-precision float to unsigned integer.
 *
 * @param[in] rs1 Floating-point value to convert.
 * @return Word delivered by the instruction.
 **************************************************************************/
inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fcvt_wus(float rs1) {

  // hand the raw bit pattern of the float to the instruction
  const float_conv_t src = { .float_value = rs1 };

  return CUSTOM_INSTR_R1_TYPE(0b1100000, 0b00001, src.binary_value, 0b000, 0b1010011);
}
 
 
/**********************************************************************//**
 * Zfinx intrinsic: convert single-precision float to signed integer.
 *
 * @param[in] rs1 Floating-point value to convert.
 * @return Word delivered by the instruction, cast to int32_t.
 **************************************************************************/
inline int32_t __attribute__ ((always_inline)) riscv_intrinsic_fcvt_ws(float rs1) {

  // hand the raw bit pattern of the float to the instruction
  const float_conv_t src = { .float_value = rs1 };

  return (int32_t)CUSTOM_INSTR_R1_TYPE(0b1100000, 0b00000, src.binary_value, 0b000, 0b1010011);
}
 
 
/**********************************************************************//**
 * Zfinx intrinsic: convert unsigned integer to single-precision float.
 *
 * @param[in] rs1 Unsigned integer to convert.
 * @return Word delivered by the instruction, reinterpreted as float.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fcvt_swu(uint32_t rs1) {

  // the integer operand is passed as-is; only the result needs reinterpretation
  float_conv_t dst;
  dst.binary_value = CUSTOM_INSTR_R1_TYPE(0b1101000, 0b00001, rs1, 0b000, 0b1010011);

  return dst.float_value;
}
 
 
/**********************************************************************//**
 * Zfinx intrinsic: convert signed integer to single-precision float.
 *
 * @param[in] rs1 Signed integer to convert.
 * @return Word delivered by the instruction, reinterpreted as float.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fcvt_sw(int32_t rs1) {

  // the integer operand is passed as-is; only the result needs reinterpretation
  float_conv_t dst;
  dst.binary_value = CUSTOM_INSTR_R1_TYPE(0b1101000, 0b00000, rs1, 0b000, 0b1010011);

  return dst.float_value;
}
 
 
/**********************************************************************//**
 * Zfinx intrinsic: single-precision floating-point equal comparison.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Word delivered by the instruction.
 **************************************************************************/
inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_feqs(float rs1, float rs2) {

  // reinterpret both floats as raw 32-bit words
  const float_conv_t src1 = { .float_value = rs1 };
  const float_conv_t src2 = { .float_value = rs2 };

  // all three compare intrinsics share the leading code; the 3-bit field (010) selects "equal"
  return CUSTOM_INSTR_R2_TYPE(0b1010000, src2.binary_value, src1.binary_value, 0b010, 0b1010011);
}
 
 
/**********************************************************************//**
 * Zfinx intrinsic: single-precision floating-point less-than comparison.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Word delivered by the instruction.
 **************************************************************************/
inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_flts(float rs1, float rs2) {

  // reinterpret both floats as raw 32-bit words
  const float_conv_t src1 = { .float_value = rs1 };
  const float_conv_t src2 = { .float_value = rs2 };

  // all three compare intrinsics share the leading code; the 3-bit field (001) selects "less than"
  return CUSTOM_INSTR_R2_TYPE(0b1010000, src2.binary_value, src1.binary_value, 0b001, 0b1010011);
}
 
 
/**********************************************************************//**
 * Zfinx intrinsic: single-precision floating-point less-than-or-equal comparison.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Word delivered by the instruction.
 **************************************************************************/
inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fles(float rs1, float rs2) {

  // reinterpret both floats as raw 32-bit words
  const float_conv_t src1 = { .float_value = rs1 };
  const float_conv_t src2 = { .float_value = rs2 };

  // all three compare intrinsics share the leading code; the 3-bit field (000) selects "less or equal"
  return CUSTOM_INSTR_R2_TYPE(0b1010000, src2.binary_value, src1.binary_value, 0b000, 0b1010011);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point sign-injection
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjs(float rs1, float rs2) {
 
  float_conv_t opa, opb, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
 
  res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point sign-injection NOT
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjns(float rs1, float rs2) {
 
  float_conv_t opa, opb, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
 
  res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, opb.binary_value, opa.binary_value, 0b001, 0b1010011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point sign-injection XOR
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjxs(float rs1, float rs2) {
 
  float_conv_t opa, opb, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
 
  res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, opb.binary_value, opa.binary_value, 0b010, 0b1010011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Zfinx intrinsic: single-precision floating-point number classification.
 *
 * @param[in] rs1 Value to classify.
 * @return Word delivered by the instruction.
 **************************************************************************/
inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fclasss(float rs1) {

  // hand the raw bit pattern of the float to the instruction
  const float_conv_t src = { .float_value = rs1 };

  return CUSTOM_INSTR_R1_TYPE(0b1110000, 0b00000, src.binary_value, 0b001, 0b1010011);
}
 
 
// ################################################################################################
// !!! UNSUPPORTED instructions !!!
// ################################################################################################
 
/**********************************************************************//**
 * Single-precision floating-point division
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fdivs(float rs1, float rs2) {
 
  float_conv_t opa, opb, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
 
  res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0001100, opb.binary_value, opa.binary_value, 0b000, 0b1010011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point square root
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * @param[in] rs1 Source operand 1.
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fsqrts(float rs1) {
 
  float_conv_t opa, res;
  opa.float_value = rs1;
 
  res.binary_value = CUSTOM_INSTR_R1_TYPE(0b0101100, 0b00000, opa.binary_value, 0b000, 0b1010011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused multiply-add
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fmadds(float rs1, float rs2, float rs3) {
 
  float_conv_t opa, opb, opc, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
  opc.float_value = rs3;
 
  res.binary_value = CUSTOM_INSTR_R3_TYPE(opc.binary_value, opb.binary_value, opa.binary_value, 0b000, 0b1000011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused multiply-sub
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fmsubs(float rs1, float rs2, float rs3) {
 
  float_conv_t opa, opb, opc, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
  opc.float_value = rs3;
 
  res.binary_value = CUSTOM_INSTR_R3_TYPE(opc.binary_value, opb.binary_value, opa.binary_value, 0b000, 0b1000111);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused negated multiply-sub
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fnmsubs(float rs1, float rs2, float rs3) {
 
  float_conv_t opa, opb, opc, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
  opc.float_value = rs3;
 
  res.binary_value = CUSTOM_INSTR_R3_TYPE(opc.binary_value, opb.binary_value, opa.binary_value, 0b000, 0b1001011);
  return res.float_value;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused negated multiply-add
 *
 * @warning This instruction is not supported and should raise an illegal instruction exception when executed.
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
inline float __attribute__ ((always_inline)) riscv_intrinsic_fnmadds(float rs1, float rs2, float rs3) {
 
  float_conv_t opa, opb, opc, res;
  opa.float_value = rs1;
  opb.float_value = rs2;
  opc.float_value = rs3;
 
  res.binary_value = CUSTOM_INSTR_R3_TYPE(opc.binary_value, opb.binary_value, opa.binary_value, 0b000, 0b1001111);
  return res.float_value;
}
 
 
// ################################################################################################
// Emulation functions
// ################################################################################################
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point addition.
 * Subnormal inputs and a subnormal result are flushed to zero.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Flushed sum of the flushed operands.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fadds(float rs1, float rs2) {

  const float lhs = subnormal_flush(rs1);
  const float rhs = subnormal_flush(rs2);

  const float sum = lhs + rhs;

  // the result might be subnormal again
  return subnormal_flush(sum);
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point subtraction.
 * Subnormal inputs and a subnormal result are flushed to zero.
 *
 * @param[in] rs1 Source operand 1 (minuend).
 * @param[in] rs2 Source operand 2 (subtrahend).
 * @return Flushed difference of the flushed operands.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fsubs(float rs1, float rs2) {

  const float lhs = subnormal_flush(rs1);
  const float rhs = subnormal_flush(rs2);

  const float difference = lhs - rhs;

  // the result might be subnormal again
  return subnormal_flush(difference);
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point multiplication.
 * Subnormal inputs and a subnormal result are flushed to zero.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return Flushed product of the flushed operands.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fmuls(float rs1, float rs2) {

  const float lhs = subnormal_flush(rs1);
  const float rhs = subnormal_flush(rs2);

  const float product = lhs * rhs;

  // the result might be subnormal again
  return subnormal_flush(product);
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point minimum.
 * Subnormal inputs are flushed to zero before the comparison.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return NaN if both operands are NaN, the non-NaN operand if exactly one is NaN,
 * -0.0 for a (+0, -0) pair, otherwise the smaller operand.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fmins(float rs1, float rs2) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);

  union {
    uint32_t binary_value; /**< Access in binary representation */
    float    float_value;  /**< Access as native float */
  } tmp_a, tmp_b;

  const int a_is_nan = (fpclassify(opa) == FP_NAN);
  const int b_is_nan = (fpclassify(opb) == FP_NAN);

  // both NaN: the result is NaN as well
  if (a_is_nan && b_is_nan) {
    return nanf("");
  }

  // exactly one NaN: the other operand wins
  if (a_is_nan) {
    return opb;
  }
  if (b_is_nan) {
    return opa;
  }

  // RISC-V spec: -0 < +0 (checked on the bit patterns since -0.0f == +0.0f in C)
  tmp_a.float_value = opa;
  tmp_b.float_value = opb;
  if (((tmp_a.binary_value == 0x80000000) && (tmp_b.binary_value == 0x00000000)) ||
      ((tmp_a.binary_value == 0x00000000) && (tmp_b.binary_value == 0x80000000))) {
    return -0.0f;
  }

  // single-precision variant: avoids promoting both operands to double
  return fminf(opa, opb);
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point maximum.
 * Subnormal inputs are flushed to zero before the comparison.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return NaN if both operands are NaN, the non-NaN operand if exactly one is NaN,
 * +0.0 for a (+0, -0) pair, otherwise the larger operand.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fmaxs(float rs1, float rs2) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);

  union {
    uint32_t binary_value; /**< Access in binary representation */
    float    float_value;  /**< Access as native float */
  } tmp_a, tmp_b;

  const int a_is_nan = (fpclassify(opa) == FP_NAN);
  const int b_is_nan = (fpclassify(opb) == FP_NAN);

  // both NaN: the result is NaN as well
  if (a_is_nan && b_is_nan) {
    return nanf("");
  }

  // exactly one NaN: the other operand wins
  if (a_is_nan) {
    return opb;
  }
  if (b_is_nan) {
    return opa;
  }

  // RISC-V spec: -0 < +0 (checked on the bit patterns since -0.0f == +0.0f in C)
  tmp_a.float_value = opa;
  tmp_b.float_value = opb;
  if (((tmp_a.binary_value == 0x80000000) && (tmp_b.binary_value == 0x00000000)) ||
      ((tmp_a.binary_value == 0x00000000) && (tmp_b.binary_value == 0x80000000))) {
    return +0.0f;
  }

  // single-precision variant: avoids promoting both operands to double
  return fmaxf(opa, opb);
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision float to unsigned integer.
 * A subnormal input is flushed to zero first. The value is rounded to nearest,
 * ties to even (assuming the default rounding mode is active), and values that
 * do not fit are saturated instead of being cast (an out-of-range cast is
 * undefined behavior in C).
 *
 * @param[in] rs1 Source operand 1.
 * @return Rounded value; 0 for negative inputs, 0xFFFFFFFF for NaN and too-large inputs.
 **************************************************************************/
uint32_t __attribute__ ((noinline)) riscv_emulate_fcvt_wus(float rs1) {

  float opa = subnormal_flush(rs1);

  // NaN maps to the largest representable value
  if (fpclassify(opa) == FP_NAN) {
    return 0xFFFFFFFFu;
  }

  // rintf honors the current rounding mode (default: ties to even); roundf would round ties away from zero
  float rounded = rintf(opa);

  // saturate at the lower bound (this also covers -infinity)
  if (rounded <= 0.0f) {
    return 0;
  }

  // saturate at the upper bound (this also covers +infinity); 2^32 is exactly representable
  if (rounded >= 4294967296.0f) {
    return 0xFFFFFFFFu;
  }

  return (uint32_t)rounded;
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision float to signed integer.
 * A subnormal input is flushed to zero first. The value is rounded to nearest,
 * ties to even (assuming the default rounding mode is active), and values that
 * do not fit are saturated instead of being cast (an out-of-range cast is
 * undefined behavior in C).
 *
 * @param[in] rs1 Source operand 1.
 * @return Rounded value; most positive int32 for NaN and too-large inputs,
 * most negative int32 for too-small inputs.
 **************************************************************************/
int32_t __attribute__ ((noinline)) riscv_emulate_fcvt_ws(float rs1) {

  float opa = subnormal_flush(rs1);

  // NaN maps to the most positive value
  if (fpclassify(opa) == FP_NAN) {
    return 0x7FFFFFFF;
  }

  // rintf honors the current rounding mode (default: ties to even); roundf would round ties away from zero
  float rounded = rintf(opa);

  // saturate at the upper bound (this also covers +infinity); 2^31 is exactly representable
  if (rounded >= 2147483648.0f) {
    return 0x7FFFFFFF;
  }

  // saturate at the lower bound (this also covers -infinity)
  if (rounded <= -2147483648.0f) {
    return (int32_t)(-0x7FFFFFFF - 1);
  }

  return (int32_t)rounded;
}
 
 
/**********************************************************************//**
 * Software emulation: unsigned integer to single-precision float.
 *
 * @param[in] rs1 Unsigned integer to convert.
 * @return rs1 converted to float by a plain C cast.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fcvt_swu(uint32_t rs1) {

  // plain value conversion, no flushing required for integer inputs
  const float converted = (float)rs1;

  return converted;
}
 
 
/**********************************************************************//**
 * Software emulation: signed integer to single-precision float.
 *
 * @param[in] rs1 Signed integer to convert.
 * @return rs1 converted to float by a plain C cast.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fcvt_sw(int32_t rs1) {

  // plain value conversion, no flushing required for integer inputs
  const float converted = (float)rs1;

  return converted;
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point equal comparison.
 * Subnormal inputs are flushed to zero before the comparison.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return 1 if the operands compare equal, 0 otherwise (always 0 if any operand is NaN).
 **************************************************************************/
uint32_t __attribute__ ((noinline)) riscv_emulate_feqs(float rs1, float rs2) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);

  // a NaN never compares equal to anything
  if ((fpclassify(opa) == FP_NAN) || (fpclassify(opb) == FP_NAN)) {
    return 0;
  }

  // the condition is parenthesized explicitly; do not rely on how the libc expands the macros
  if ((isless(opa, opb)) || (isgreater(opa, opb))) {
    return 0;
  }

  // neither less nor greater: equal (this includes +0 and -0)
  return 1;
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point less-than comparison.
 * Subnormal inputs are flushed to zero before the comparison.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return 1 if rs1 is less than rs2, 0 otherwise (always 0 if any operand is NaN).
 **************************************************************************/
uint32_t __attribute__ ((noinline)) riscv_emulate_flts(float rs1, float rs2) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);

  // comparisons involving NaN are always false
  if ((fpclassify(opa) == FP_NAN) || (fpclassify(opb) == FP_NAN)) {
    return 0;
  }

  // the condition is parenthesized explicitly; do not rely on how the libc expands the macro
  if (isless(opa, opb)) {
    return 1;
  }

  return 0;
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point less-than-or-equal comparison.
 * Subnormal inputs are flushed to zero before the comparison.
 *
 * @param[in] rs1 Source operand 1.
 * @param[in] rs2 Source operand 2.
 * @return 1 if rs1 is less than or equal to rs2, 0 otherwise (always 0 if any operand is NaN).
 **************************************************************************/
uint32_t __attribute__ ((noinline)) riscv_emulate_fles(float rs1, float rs2) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);

  // comparisons involving NaN are always false
  if ((fpclassify(opa) == FP_NAN) || (fpclassify(opb) == FP_NAN)) {
    return 0;
  }

  // the condition is parenthesized explicitly; do not rely on how the libc expands the macro
  if (islessequal(opa, opb)) {
    return 1;
  }

  return 0;
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point sign-injection.
 * The result carries the magnitude of rs1 and the sign of rs2.
 * Subnormal inputs are flushed to zero first.
 *
 * @param[in] rs1 Source operand 1 (magnitude).
 * @param[in] rs2 Source operand 2 (sign).
 * @return Flushed rs1 with the sign of the flushed rs2.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fsgnjs(float rs1, float rs2) {

  const float opa = subnormal_flush(rs1);
  const float opb = subnormal_flush(rs2);

  const int a_negative = (signbit(opa) != 0);
  const int b_negative = (signbit(opb) != 0);

  // signs already agree: nothing to do, otherwise flip the sign of opa
  return (a_negative == b_negative) ? opa : -opa;
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point sign-injection NOT.
 * The result carries the magnitude of rs1 and the inverted sign of rs2.
 * Subnormal inputs are flushed to zero first.
 *
 * @param[in] rs1 Source operand 1 (magnitude).
 * @param[in] rs2 Source operand 2 (sign, inverted).
 * @return Flushed rs1 with the opposite sign of the flushed rs2.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fsgnjns(float rs1, float rs2) {

  const float opa = subnormal_flush(rs1);
  const float opb = subnormal_flush(rs2);

  const int a_negative = (signbit(opa) != 0);
  const int b_negative = (signbit(opb) != 0);

  // signs already differ: nothing to do, otherwise flip the sign of opa
  return (a_negative != b_negative) ? opa : -opa;
}
 
 
/**********************************************************************//**
 * Software emulation: single-precision floating-point sign-injection XOR.
 * The result carries the magnitude of rs1; its sign is the XOR of both operands' signs.
 * Subnormal inputs are flushed to zero first.
 *
 * @param[in] rs1 Source operand 1 (magnitude).
 * @param[in] rs2 Source operand 2.
 * @return Flushed rs1, negated if the flushed rs2 is negative.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fsgnjxs(float rs1, float rs2) {

  const float opa = subnormal_flush(rs1);
  const float opb = subnormal_flush(rs2);

  const int b_negative = (signbit(opb) != 0);

  // XOR-ing the signs boils down to: a negative opb toggles the sign of opa, a positive one keeps it
  return b_negative ? -opa : opa;
}
 
 
/**********************************************************************//**
 * Single-precision floating-point number classification (software emulation)
 *
 * The operand is passed through subnormal_flush() and then classified via
 * fpclassify() / signbit(). At most one bit of the result is set.
 *
 * @param[in] rs1 Source operand 1.
 * @return Classification mask (bit 0: -inf, 1: -normal, 2: -subnormal,
 * 3: -zero, 4: +zero, 5: +subnormal, 6: +normal, 7: +inf, 8: sNaN, 9: qNaN);
 * zero if fpclassify() reports none of the handled categories.
 **************************************************************************/
uint32_t __attribute__ ((noinline)) riscv_emulate_fclasss(float rs1) {

  // RISC-V classify result layout
  enum {
    CLASS_NEG_INF    = 1 << 0, // negative infinity
    CLASS_NEG_NORM   = 1 << 1, // negative normal number
    CLASS_NEG_DENORM = 1 << 2, // negative subnormal number
    CLASS_NEG_ZERO   = 1 << 3, // negative zero
    CLASS_POS_ZERO   = 1 << 4, // positive zero
    CLASS_POS_DENORM = 1 << 5, // positive subnormal number
    CLASS_POS_NORM   = 1 << 6, // positive normal number
    CLASS_POS_INF    = 1 << 7, // positive infinity
    CLASS_SNAN       = 1 << 8, // signaling NaN (sNaN)
    CLASS_QNAN       = 1 << 9  // quiet NaN (qNaN)
  };

  const float value    = subnormal_flush(rs1);
  const int   negative = (signbit(value) != 0);

  switch (fpclassify(value)) {

    case FP_INFINITE:
      return negative ? CLASS_NEG_INF : CLASS_POS_INF;

    case FP_ZERO:
      return negative ? CLASS_NEG_ZERO : CLASS_POS_ZERO;

    case FP_NORMAL:
      return negative ? CLASS_NEG_NORM : CLASS_POS_NORM;

    case FP_SUBNORMAL:
      // NOTE(review): subnormal_flush() presumably already turned subnormals into zeros,
      // so this case is not expected to trigger - kept for completeness
      return negative ? CLASS_NEG_DENORM : CLASS_POS_DENORM;

    case FP_NAN: {
      union {
        uint32_t binary_value; /**< Access in binary representation */
        float    float_value;  /**< Access as native float */
      } raw;

      raw.float_value = value;

      // bit 22 (mantissa's MSB) set -> quiet NaN, cleared -> signaling NaN
      return ((raw.binary_value >> 22) & 1u) ? CLASS_QNAN : CLASS_SNAN;
    }

    default:
      return 0; // no known class
  }
}
 
 
/**********************************************************************//**
 * Single-precision floating-point division (software emulation)
 *
 * Operands and the quotient are each passed through subnormal_flush().
 *
 * @param[in] rs1 Source operand 1 (dividend).
 * @param[in] rs2 Source operand 2 (divisor).
 * @return rs1 / rs2.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fdivs(float rs1, float rs2) {

  const float dividend = subnormal_flush(rs1);
  const float divisor  = subnormal_flush(rs2);
  const float quotient = dividend / divisor;

  return subnormal_flush(quotient);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point square root (software emulation)
 *
 * The operand and the computed root are each passed through
 * subnormal_flush(); the root itself is computed by sqrtf().
 *
 * @param[in] rs1 Source operand 1 (radicand).
 * @return Square root of rs1.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fsqrts(float rs1) {

  const float radicand = subnormal_flush(rs1);
  const float root     = sqrtf(radicand);

  return subnormal_flush(root);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused multiply-add (software emulation)
 *
 * Computes (rs1 * rs2) + rs3. All operands and the result are passed through
 * subnormal_flush(). The operation is evaluated via fmaf() so the product is
 * not rounded before the addition (a plain "a * b + c" expression would round
 * twice and therefore not be a fused operation).
 *
 * @warning This instruction is not supported!
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fmadds(float rs1, float rs2, float rs3) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);
  float opc = subnormal_flush(rs3);

  // fused: (opa * opb) + opc with a single rounding step
  float res = fmaf(opa, opb, opc);
  return subnormal_flush(res);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused multiply-sub (software emulation)
 *
 * Computes (rs1 * rs2) - rs3. All operands and the result are passed through
 * subnormal_flush(). The operation is evaluated via fmaf() so the product is
 * not rounded before the subtraction (a plain "a * b - c" expression would
 * round twice and therefore not be a fused operation).
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fmsubs(float rs1, float rs2, float rs3) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);
  float opc = subnormal_flush(rs3);

  // fused: (opa * opb) - opc with a single rounding step
  float res = fmaf(opa, opb, -opc);
  return subnormal_flush(res);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused negated multiply-sub (software emulation)
 *
 * Computes -(rs1 * rs2) + rs3. All operands and the result are passed through
 * subnormal_flush(). The operation is evaluated via fmaf() with a negated
 * multiplicand, so the (negated) product is not rounded before the addition
 * (a plain "-(a * b) + c" expression would round twice and therefore not be
 * a fused operation).
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fnmsubs(float rs1, float rs2, float rs3) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);
  float opc = subnormal_flush(rs3);

  // fused: -(opa * opb) + opc with a single rounding step;
  // negating one factor negates the exact product
  float res = fmaf(-opa, opb, opc);
  return subnormal_flush(res);
}
 
 
/**********************************************************************//**
 * Single-precision floating-point fused negated multiply-add (software emulation)
 *
 * Computes -(rs1 * rs2) - rs3. All operands and the result are passed through
 * subnormal_flush(). The operation is evaluated via fmaf() with a negated
 * multiplicand and a negated addend, so the (negated) product is not rounded
 * before the subtraction (a plain "-(a * b) - c" expression would round twice
 * and therefore not be a fused operation).
 *
 * @param[in] rs1 Source operand 1
 * @param[in] rs2 Source operand 2
 * @param[in] rs3 Source operand 3
 * @return Result.
 **************************************************************************/
float __attribute__ ((noinline)) riscv_emulate_fnmadds(float rs1, float rs2, float rs3) {

  float opa = subnormal_flush(rs1);
  float opb = subnormal_flush(rs2);
  float opc = subnormal_flush(rs3);

  // fused: -(opa * opb) - opc with a single rounding step;
  // negating one factor negates the exact product
  float res = fmaf(-opa, opb, -opc);
  return subnormal_flush(res);
}
 
 
#endif // neorv32_zfinx_extension_intrinsics_h
 

Line No.	Rev	Author	Line
1	55	zero_gravi	`// #################################################################################################`
2			`// # << NEORV32 - Intrinsics + Emulation Functions for the RISC-V "Zfinx" CPU extension >> #`
3			`// # ********************************************************************************************* #`
4			`// # The intrinsics provided by this library allow to use the hardware floating-point unit of the #`
5			`// # RISC-V Zfinx CPU extension without the need for Zfinx support by the compiler / toolchain. #`
6			`// # ********************************************************************************************* #`
7			`// # BSD 3-Clause License #`
8			`// # #`
9	71	zero_gravi	`// # Copyright (c) 2022, Stephan Nolting. All rights reserved. #`
10	55	zero_gravi	`// # #`
11			`// # Redistribution and use in source and binary forms, with or without modification, are #`
12			`// # permitted provided that the following conditions are met: #`
13			`// # #`
14			`// # 1. Redistributions of source code must retain the above copyright notice, this list of #`
15			`// # conditions and the following disclaimer. #`
16			`// # #`
17			`// # 2. Redistributions in binary form must reproduce the above copyright notice, this list of #`
18			`// # conditions and the following disclaimer in the documentation and/or other materials #`
19			`// # provided with the distribution. #`
20			`// # #`
21			`// # 3. Neither the name of the copyright holder nor the names of its contributors may be used to #`
22			`// # endorse or promote products derived from this software without specific prior written #`
23			`// # permission. #`
24			`// # #`
25			`// # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS #`
26			`// # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF #`
27			`// # MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE #`
28			`// # COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, #`
29			`// # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE #`
30			`// # GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED #`
31			`// # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING #`
32			`// # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED #`
33			`// # OF THE POSSIBILITY OF SUCH DAMAGE. #`
34			`// # ********************************************************************************************* #`
35			`// # The NEORV32 Processor - https://github.com/stnolting/neorv32 (c) Stephan Nolting #`
36			`// #################################################################################################`
37
38
39			`/********************************************************************//`
40			`* @file floating_point_test/neorv32_zfinx_extension_intrinsics.h`
41			`* @author Stephan Nolting`
42			`*`
43			`* @brief "Intrinsic" library for the NEORV32 single-precision floating-point in x registers (Zfinx) extension`
44			`* @brief Also provides emulation functions for all intrinsics (functionality re-built in pure software). The functionality of the emulation`
45			`* @brief functions is based on the RISC-V floating-point spec.`
46			`*`
47			`* @note All operations from this library use the default GCC "round to nearest, ties to even" rounding mode.`
48			`*`
49			`* @warning This library is just a temporary fall-back until the Zfinx extensions are supported by the upstream RISC-V GCC port.`
50			`**************************************************************************/`
51
52			`#ifndef neorv32_zfinx_extension_intrinsics_h`
53			`#define neorv32_zfinx_extension_intrinsics_h`
54
55			`#define __USE_GNU`
56
57			`#include <fenv.h>`
58			`//#pragma STDC FENV_ACCESS ON`
59
60			`#define _GNU_SOURCE`
61
62			`#include <float.h>`
63			`#include <math.h>`
64
65
66			`/********************************************************************//`
67			`* Sanity check`
68			`**************************************************************************/`
69			`#if defined __riscv_f \|\| (__riscv_flen == 32)`
70			`#error Application programs using the Zfinx intrinsic library have to be compiled WITHOUT the <F> MARCH ISA attribute!`
71			`#endif`
72
73
74			`/********************************************************************//`
75			`* Custom data type to access floating-point values as native floats and in binary representation`
76			`**************************************************************************/`
77			`typedef union`
78			`{`
79			`uint32_t binary_value; /*< Access as native float /`
80			`float float_value; /*< Access in binary representation /`
81			`} float_conv_t;`
82
83
84			`// ################################################################################################`
85			`// Helper functions`
86			`// ################################################################################################`
87
88			`/********************************************************************//`
89			`* Flush to zero if denormal number.`
90			`*`
91			`* @warning Subnormal numbers are not supported yet! Flush them to zero.`
92			`*`
93	56	zero_gravi	`* @param[in] tmp Source operand.`
94	55	zero_gravi	`* @return Result.`
95			`**************************************************************************/`
96			`float subnormal_flush(float tmp) {`
97
98			`float res = tmp;`
99
100			`if (fpclassify(tmp) == FP_SUBNORMAL) {`
101			`if (signbit(tmp) != 0) {`
102			`res = -0.0f;`
103			`}`
104			`else {`
105			`res = +0.0f;`
106			`}`
107			`}`
108
109			`return res;`
110			`}`
111
112
113			`// ################################################################################################`
114			`// Exception access`
115			`// ################################################################################################`
116
117			`/********************************************************************//`
118			`* Get exception flags from fflags CSR (floating-point hardware).`
119			`*`
120			`* @return Floating point exception status word.`
121			`**************************************************************************/`
122			`uint32_t get_hw_exceptions(void) {`
123
124			`uint32_t res = neorv32_cpu_csr_read(CSR_FFLAGS);`
125
126			`neorv32_cpu_csr_write(CSR_FFLAGS, 0); // clear status word`
127
128			`return res;`
129			`}`
130
131
132			`/********************************************************************//`
133			`* Get exception flags from C runtime (floating-point emulation).`
134			`*`
135			`* @warning WORK-IN-PROGRESS!`
136			`*`
137			`* @return Floating point exception status word.`
138			`**************************************************************************/`
139			`uint32_t get_sw_exceptions(void) {`
140
141			`const uint32_t FP_EXC_NV_C = 1 << 0; // invalid operation`
142			`const uint32_t FP_EXC_DZ_C = 1 << 1; // divide by zero`
143			`const uint32_t FP_EXC_OF_C = 1 << 2; // overflow`
144			`const uint32_t FP_EXC_UF_C = 1 << 3; // underflow`
145			`const uint32_t FP_EXC_NX_C = 1 << 4; // inexact`
146
147			`int fpeRaised = fetestexcept(FE_ALL_EXCEPT);`
148
149			`uint32_t res = 0;`
150
151			`if (fpeRaised & FE_INVALID) { res \|= FP_EXC_NV_C; }`
152			`if (fpeRaised & FE_DIVBYZERO) { res \|= FP_EXC_DZ_C; }`
153			`if (fpeRaised & FE_OVERFLOW) { res \|= FP_EXC_OF_C; }`
154			`if (fpeRaised & FE_UNDERFLOW) { res \|= FP_EXC_UF_C; }`
155			`if (fpeRaised & FE_INEXACT) { res \|= FP_EXC_NX_C; }`
156
157			`feclearexcept(FE_ALL_EXCEPT);`
158
159			`return res;`
160			`}`
161
162
163			`// ################################################################################################`
164			`// "Intrinsics"`
165			`// ################################################################################################`
166
167			`/********************************************************************//`
168			`* Single-precision floating-point addition`
169			`*`
170	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
171			`* @param[in] rs2 Source operand 2.`
172	55	zero_gravi	`* @return Result.`
173			`**************************************************************************/`
174	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fadds(float rs1, float rs2) {`
175	55	zero_gravi
176			`float_conv_t opa, opb, res;`
177			`opa.float_value = rs1;`
178			`opb.float_value = rs2;`
179
180	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0000000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
181	55	zero_gravi	`return res.float_value;`
182			`}`
183
184
185			`/********************************************************************//`
186			`* Single-precision floating-point subtraction`
187			`*`
188	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
189			`* @param[in] rs2 Source operand 2.`
190	55	zero_gravi	`* @return Result.`
191			`**************************************************************************/`
192	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fsubs(float rs1, float rs2) {`
193	55	zero_gravi
194			`float_conv_t opa, opb, res;`
195			`opa.float_value = rs1;`
196			`opb.float_value = rs2;`
197
198	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0000100, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
199	55	zero_gravi	`return res.float_value;`
200			`}`
201
202
203			`/********************************************************************//`
204			`* Single-precision floating-point multiplication`
205			`*`
206	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
207			`* @param[in] rs2 Source operand 2.`
208	55	zero_gravi	`* @return Result.`
209			`**************************************************************************/`
210	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fmuls(float rs1, float rs2) {`
211	55	zero_gravi
212			`float_conv_t opa, opb, res;`
213			`opa.float_value = rs1;`
214			`opb.float_value = rs2;`
215
216	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0001000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
217	55	zero_gravi	`return res.float_value;`
218			`}`
219
220
221			`/********************************************************************//`
222			`* Single-precision floating-point minimum`
223			`*`
224	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
225			`* @param[in] rs2 Source operand 2.`
226	55	zero_gravi	`* @return Result.`
227			`**************************************************************************/`
228	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fmins(float rs1, float rs2) {`
229	55	zero_gravi
230			`float_conv_t opa, opb, res;`
231			`opa.float_value = rs1;`
232			`opb.float_value = rs2;`
233
234	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010100, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
235	55	zero_gravi	`return res.float_value;`
236			`}`
237
238
239			`/********************************************************************//`
240			`* Single-precision floating-point maximum`
241			`*`
242	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
243			`* @param[in] rs2 Source operand 2.`
244	55	zero_gravi	`* @return Result.`
245			`**************************************************************************/`
246	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fmaxs(float rs1, float rs2) {`
247	55	zero_gravi
248			`float_conv_t opa, opb, res;`
249			`opa.float_value = rs1;`
250			`opb.float_value = rs2;`
251
252	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010100, opb.binary_value, opa.binary_value, 0b001, 0b1010011);`
253	55	zero_gravi	`return res.float_value;`
254			`}`
255
256
257			`/********************************************************************//`
258			`* Single-precision floating-point convert float to unsigned integer`
259			`*`
260	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
261	55	zero_gravi	`* @return Result.`
262			`**************************************************************************/`
263	56	zero_gravi	`inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fcvt_wus(float rs1) {`
264	55	zero_gravi
265			`float_conv_t opa;`
266			`opa.float_value = rs1;`
267
268	71	zero_gravi	`return CUSTOM_INSTR_R1_TYPE(0b1100000, 0b00001, opa.binary_value, 0b000, 0b1010011);`
269	55	zero_gravi	`}`
270
271
272			`/********************************************************************//`
273			`* Single-precision floating-point convert float to signed integer`
274			`*`
275	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
276	55	zero_gravi	`* @return Result.`
277			`**************************************************************************/`
278	56	zero_gravi	`inline int32_t __attribute__ ((always_inline)) riscv_intrinsic_fcvt_ws(float rs1) {`
279	55	zero_gravi
280			`float_conv_t opa;`
281			`opa.float_value = rs1;`
282
283	71	zero_gravi	`return (int32_t)CUSTOM_INSTR_R1_TYPE(0b1100000, 0b00000, opa.binary_value, 0b000, 0b1010011);`
284	55	zero_gravi	`}`
285
286
287			`/********************************************************************//`
288			`* Single-precision floating-point convert unsigned integer to float`
289			`*`
290	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
291	55	zero_gravi	`* @return Result.`
292			`**************************************************************************/`
293	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fcvt_swu(uint32_t rs1) {`
294	55	zero_gravi
295			`float_conv_t res;`
296
297	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R1_TYPE(0b1101000, 0b00001, rs1, 0b000, 0b1010011);`
298	55	zero_gravi	`return res.float_value;`
299			`}`
300
301
302			`/********************************************************************//`
303			`* Single-precision floating-point convert signed integer to float`
304			`*`
305	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
306	55	zero_gravi	`* @return Result.`
307			`**************************************************************************/`
308	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fcvt_sw(int32_t rs1) {`
309	55	zero_gravi
310			`float_conv_t res;`
311
312	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R1_TYPE(0b1101000, 0b00000, rs1, 0b000, 0b1010011);`
313	55	zero_gravi	`return res.float_value;`
314			`}`
315
316
317			`/********************************************************************//`
318			`* Single-precision floating-point equal comparison`
319			`*`
320	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
321			`* @param[in] rs2 Source operand 2.`
322	55	zero_gravi	`* @return Result.`
323			`**************************************************************************/`
324	56	zero_gravi	`inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_feqs(float rs1, float rs2) {`
325	55	zero_gravi
326			`float_conv_t opa, opb;`
327			`opa.float_value = rs1;`
328			`opb.float_value = rs2;`
329
330	71	zero_gravi	`return CUSTOM_INSTR_R2_TYPE(0b1010000, opb.binary_value, opa.binary_value, 0b010, 0b1010011);`
331	55	zero_gravi	`}`
332
333
334			`/********************************************************************//`
335			`* Single-precision floating-point less-than comparison`
336			`*`
337	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
338			`* @param[in] rs2 Source operand 2.`
339	55	zero_gravi	`* @return Result.`
340			`**************************************************************************/`
341	56	zero_gravi	`inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_flts(float rs1, float rs2) {`
342	55	zero_gravi
343			`float_conv_t opa, opb;`
344			`opa.float_value = rs1;`
345			`opb.float_value = rs2;`
346
347	71	zero_gravi	`return CUSTOM_INSTR_R2_TYPE(0b1010000, opb.binary_value, opa.binary_value, 0b001, 0b1010011);`
348	55	zero_gravi	`}`
349
350
351			`/********************************************************************//`
352			`* Single-precision floating-point less-than-or-equal comparison`
353			`*`
354	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
355			`* @param[in] rs2 Source operand 2.`
356	55	zero_gravi	`* @return Result.`
357			`**************************************************************************/`
358	56	zero_gravi	`inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fles(float rs1, float rs2) {`
359	55	zero_gravi
360			`float_conv_t opa, opb;`
361			`opa.float_value = rs1;`
362			`opb.float_value = rs2;`
363
364	71	zero_gravi	`return CUSTOM_INSTR_R2_TYPE(0b1010000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
365	55	zero_gravi	`}`
366
367
368			`/********************************************************************//`
369			`* Single-precision floating-point sign-injection`
370			`*`
371	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
372			`* @param[in] rs2 Source operand 2.`
373	55	zero_gravi	`* @return Result.`
374			`**************************************************************************/`
375	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjs(float rs1, float rs2) {`
376	55	zero_gravi
377			`float_conv_t opa, opb, res;`
378			`opa.float_value = rs1;`
379			`opb.float_value = rs2;`
380
381	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
382	55	zero_gravi	`return res.float_value;`
383			`}`
384
385
386			`/********************************************************************//`
387			`* Single-precision floating-point sign-injection NOT`
388			`*`
389	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
390			`* @param[in] rs2 Source operand 2.`
391	55	zero_gravi	`* @return Result.`
392			`**************************************************************************/`
393	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjns(float rs1, float rs2) {`
394	55	zero_gravi
395			`float_conv_t opa, opb, res;`
396			`opa.float_value = rs1;`
397			`opb.float_value = rs2;`
398
399	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, opb.binary_value, opa.binary_value, 0b001, 0b1010011);`
400	55	zero_gravi	`return res.float_value;`
401			`}`
402
403
404			`/********************************************************************//`
405			`* Single-precision floating-point sign-injection XOR`
406			`*`
407	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
408			`* @param[in] rs2 Source operand 2.`
409	55	zero_gravi	`* @return Result.`
410			`**************************************************************************/`
411	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fsgnjxs(float rs1, float rs2) {`
412	55	zero_gravi
413			`float_conv_t opa, opb, res;`
414			`opa.float_value = rs1;`
415			`opb.float_value = rs2;`
416
417	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0010000, opb.binary_value, opa.binary_value, 0b010, 0b1010011);`
418	55	zero_gravi	`return res.float_value;`
419			`}`
420
421
422			`/********************************************************************//`
423			`* Single-precision floating-point number classification`
424			`*`
425	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
426	55	zero_gravi	`* @return Result.`
427			`**************************************************************************/`
428	56	zero_gravi	`inline uint32_t __attribute__ ((always_inline)) riscv_intrinsic_fclasss(float rs1) {`
429	55	zero_gravi
430			`float_conv_t opa;`
431			`opa.float_value = rs1;`
432
433	71	zero_gravi	`return CUSTOM_INSTR_R1_TYPE(0b1110000, 0b00000, opa.binary_value, 0b001, 0b1010011);`
434	55	zero_gravi	`}`
435
436
437			`// ################################################################################################`
438			`// !!! UNSUPPORTED instructions !!!`
439			`// ################################################################################################`
440
441			`/********************************************************************//`
442			`* Single-precision floating-point division`
443			`*`
444			`* @warning This instruction is not supported and should raise an illegal instruction exception when executed.`
445			`*`
446	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
447			`* @param[in] rs2 Source operand 2.`
448	55	zero_gravi	`* @return Result.`
449			`**************************************************************************/`
450	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fdivs(float rs1, float rs2) {`
451	55	zero_gravi
452			`float_conv_t opa, opb, res;`
453			`opa.float_value = rs1;`
454			`opb.float_value = rs2;`
455
456	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R2_TYPE(0b0001100, opb.binary_value, opa.binary_value, 0b000, 0b1010011);`
457	55	zero_gravi	`return res.float_value;`
458			`}`
459
460
461			`/********************************************************************//`
462			`* Single-precision floating-point square root`
463			`*`
464			`* @warning This instruction is not supported and should raise an illegal instruction exception when executed.`
465			`*`
466	71	zero_gravi	`* @param[in] rs1 Source operand 1.`
467	55	zero_gravi	`* @return Result.`
468			`**************************************************************************/`
469	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fsqrts(float rs1) {`
470	55	zero_gravi
471			`float_conv_t opa, res;`
472			`opa.float_value = rs1;`
473
474	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R1_TYPE(0b0101100, 0b00000, opa.binary_value, 0b000, 0b1010011);`
475	55	zero_gravi	`return res.float_value;`
476			`}`
477
478
479			`/********************************************************************//`
480			`* Single-precision floating-point fused multiply-add`
481			`*`
482			`* @warning This instruction is not supported and should raise an illegal instruction exception when executed.`
483			`*`
484	71	zero_gravi	`* @param[in] rs1 Source operand 1`
485			`* @param[in] rs2 Source operand 2`
486			`* @param[in] rs3 Source operand 3`
487	55	zero_gravi	`* @return Result.`
488			`**************************************************************************/`
489	56	zero_gravi	`inline float __attribute__ ((always_inline)) riscv_intrinsic_fmadds(float rs1, float rs2, float rs3) {`
490	55	zero_gravi
491			`float_conv_t opa, opb, opc, res;`
492			`opa.float_value = rs1;`
493			`opb.float_value = rs2;`
494			`opc.float_value = rs3;`
495
496	71	zero_gravi	`res.binary_value = CUSTOM_INSTR_R3_TYPE(opc.binary_value, opb.binary_value, opa.binary_value, 0b000, 0b1000011);`
497	55	zero_gravi	`return res.float_value;`
498			`}`
499
500

Browse

Tools

Subversion Repositories neorv32

[/] [neorv32/] [trunk/] [sw/] [example/] [floating_point_test/] [neorv32_zfinx_extension_intrinsics.h] - Blame information for rev 71