Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1 | /* |
Taylor Simpson | dae386b | 2023-03-06 18:58:18 -0800 | [diff] [blame] | 2 | * Copyright(c) 2019-2023 Qualcomm Innovation Center, Inc. All Rights Reserved. |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 3 | * |
| 4 | * This program is free software; you can redistribute it and/or modify |
| 5 | * it under the terms of the GNU General Public License as published by |
| 6 | * the Free Software Foundation; either version 2 of the License, or |
| 7 | * (at your option) any later version. |
| 8 | * |
| 9 | * This program is distributed in the hope that it will be useful, |
| 10 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 11 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| 12 | * GNU General Public License for more details. |
| 13 | * |
| 14 | * You should have received a copy of the GNU General Public License |
| 15 | * along with this program; if not, see <http://www.gnu.org/licenses/>. |
| 16 | */ |
| 17 | |
| 18 | #include "qemu/osdep.h" |
Peter Maydell | 25fc9b7 | 2021-07-17 11:30:17 +0100 | [diff] [blame] | 19 | #include "qemu/log.h" |
| 20 | #include "exec/exec-all.h" |
Taylor Simpson | 4699a92 | 2021-07-13 10:51:33 -0500 | [diff] [blame] | 21 | #include "exec/cpu_ldst.h" |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 22 | #include "exec/helper-proto.h" |
| 23 | #include "fpu/softfloat.h" |
| 24 | #include "cpu.h" |
| 25 | #include "internal.h" |
| 26 | #include "macros.h" |
| 27 | #include "arch.h" |
| 28 | #include "hex_arch_types.h" |
| 29 | #include "fma_emu.h" |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 30 | #include "mmvec/mmvec.h" |
| 31 | #include "mmvec/macros.h" |
Paolo Montesel | 7e8b3b3 | 2022-09-23 19:38:24 +0200 | [diff] [blame] | 32 | #include "op_helper.h" |
Taylor Simpson | 7b84fd0 | 2023-03-06 18:58:27 -0800 | [diff] [blame] | 33 | #include "translate.h" |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 34 | |
| 35 | #define SF_BIAS 127 |
| 36 | #define SF_MANTBITS 23 |
| 37 | |
| 38 | /* Exceptions processing helpers */ |
Matheus Tavares Bernardino | e1b526f | 2024-05-03 13:53:15 -0300 | [diff] [blame] | 39 | G_NORETURN void hexagon_raise_exception_err(CPUHexagonState *env, |
| 40 | uint32_t exception, |
| 41 | uintptr_t pc) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 42 | { |
Taylor Simpson | 7d9ab20 | 2021-04-08 20:07:32 -0500 | [diff] [blame] | 43 | CPUState *cs = env_cpu(env); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 44 | qemu_log_mask(CPU_LOG_INT, "%s: %d\n", __func__, exception); |
| 45 | cs->exception_index = exception; |
| 46 | cpu_loop_exit_restore(cs, pc); |
| 47 | } |
| 48 | |
Marc-André Lureau | 8905770 | 2022-04-20 17:26:02 +0400 | [diff] [blame] | 49 | G_NORETURN void HELPER(raise_exception)(CPUHexagonState *env, uint32_t excp) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 50 | { |
Matheus Tavares Bernardino | e1b526f | 2024-05-03 13:53:15 -0300 | [diff] [blame] | 51 | hexagon_raise_exception_err(env, excp, 0); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 52 | } |
| 53 | |
Paolo Montesel | 7e8b3b3 | 2022-09-23 19:38:24 +0200 | [diff] [blame] | 54 | void log_store32(CPUHexagonState *env, target_ulong addr, |
| 55 | target_ulong val, int width, int slot) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 56 | { |
| 57 | HEX_DEBUG_LOG("log_store%d(0x" TARGET_FMT_lx |
| 58 | ", %" PRId32 " [0x08%" PRIx32 "])\n", |
| 59 | width, addr, val, val); |
| 60 | env->mem_log_stores[slot].va = addr; |
| 61 | env->mem_log_stores[slot].width = width; |
| 62 | env->mem_log_stores[slot].data32 = val; |
| 63 | } |
| 64 | |
Paolo Montesel | 7e8b3b3 | 2022-09-23 19:38:24 +0200 | [diff] [blame] | 65 | void log_store64(CPUHexagonState *env, target_ulong addr, |
| 66 | int64_t val, int width, int slot) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 67 | { |
| 68 | HEX_DEBUG_LOG("log_store%d(0x" TARGET_FMT_lx |
| 69 | ", %" PRId64 " [0x016%" PRIx64 "])\n", |
| 70 | width, addr, val, val); |
| 71 | env->mem_log_stores[slot].va = addr; |
| 72 | env->mem_log_stores[slot].width = width; |
| 73 | env->mem_log_stores[slot].data64 = val; |
| 74 | } |
| 75 | |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 76 | /* Handy place to set a breakpoint */ |
| 77 | void HELPER(debug_start_packet)(CPUHexagonState *env) |
| 78 | { |
| 79 | HEX_DEBUG_LOG("Start packet: pc = 0x" TARGET_FMT_lx "\n", |
| 80 | env->gpr[HEX_REG_PC]); |
| 81 | |
| 82 | for (int i = 0; i < TOTAL_PER_THREAD_REGS; i++) { |
| 83 | env->reg_written[i] = 0; |
| 84 | } |
| 85 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 86 | |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 87 | /* Checks for bookkeeping errors between disassembly context and runtime */ |
| 88 | void HELPER(debug_check_store_width)(CPUHexagonState *env, int slot, int check) |
| 89 | { |
| 90 | if (env->mem_log_stores[slot].width != check) { |
| 91 | HEX_DEBUG_LOG("ERROR: %d != %d\n", |
| 92 | env->mem_log_stores[slot].width, check); |
| 93 | g_assert_not_reached(); |
| 94 | } |
| 95 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 96 | |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 97 | static void commit_store(CPUHexagonState *env, int slot_num, uintptr_t ra) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 98 | { |
Taylor Simpson | 4699a92 | 2021-07-13 10:51:33 -0500 | [diff] [blame] | 99 | uint8_t width = env->mem_log_stores[slot_num].width; |
| 100 | target_ulong va = env->mem_log_stores[slot_num].va; |
| 101 | |
| 102 | switch (width) { |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 103 | case 1: |
Taylor Simpson | 4699a92 | 2021-07-13 10:51:33 -0500 | [diff] [blame] | 104 | cpu_stb_data_ra(env, va, env->mem_log_stores[slot_num].data32, ra); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 105 | break; |
| 106 | case 2: |
Taylor Simpson | 4699a92 | 2021-07-13 10:51:33 -0500 | [diff] [blame] | 107 | cpu_stw_data_ra(env, va, env->mem_log_stores[slot_num].data32, ra); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 108 | break; |
| 109 | case 4: |
Taylor Simpson | 4699a92 | 2021-07-13 10:51:33 -0500 | [diff] [blame] | 110 | cpu_stl_data_ra(env, va, env->mem_log_stores[slot_num].data32, ra); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 111 | break; |
| 112 | case 8: |
Taylor Simpson | 4699a92 | 2021-07-13 10:51:33 -0500 | [diff] [blame] | 113 | cpu_stq_data_ra(env, va, env->mem_log_stores[slot_num].data64, ra); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 114 | break; |
| 115 | default: |
| 116 | g_assert_not_reached(); |
| 117 | } |
| 118 | } |
| 119 | |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 120 | void HELPER(commit_store)(CPUHexagonState *env, int slot_num) |
| 121 | { |
| 122 | uintptr_t ra = GETPC(); |
| 123 | commit_store(env, slot_num, ra); |
| 124 | } |
| 125 | |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 126 | void HELPER(gather_store)(CPUHexagonState *env, uint32_t addr, int slot) |
| 127 | { |
| 128 | mem_gather_store(env, addr, slot); |
| 129 | } |
| 130 | |
| 131 | void HELPER(commit_hvx_stores)(CPUHexagonState *env) |
| 132 | { |
| 133 | uintptr_t ra = GETPC(); |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 134 | |
| 135 | /* Normal (possibly masked) vector store */ |
Brian Cain | 20c34a9 | 2023-10-08 15:09:44 -0700 | [diff] [blame] | 136 | for (int i = 0; i < VSTORES_MAX; i++) { |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 137 | if (env->vstore_pending[i]) { |
| 138 | env->vstore_pending[i] = 0; |
| 139 | target_ulong va = env->vstore[i].va; |
| 140 | int size = env->vstore[i].size; |
| 141 | for (int j = 0; j < size; j++) { |
| 142 | if (test_bit(j, env->vstore[i].mask)) { |
| 143 | cpu_stb_data_ra(env, va + j, env->vstore[i].data.ub[j], ra); |
| 144 | } |
| 145 | } |
| 146 | } |
| 147 | } |
| 148 | |
| 149 | /* Scatter store */ |
| 150 | if (env->vtcm_pending) { |
| 151 | env->vtcm_pending = false; |
| 152 | if (env->vtcm_log.op) { |
| 153 | /* Need to perform the scatter read/modify/write at commit time */ |
| 154 | if (env->vtcm_log.op_size == 2) { |
| 155 | SCATTER_OP_WRITE_TO_MEM(uint16_t); |
| 156 | } else if (env->vtcm_log.op_size == 4) { |
| 157 | /* Word Scatter += */ |
| 158 | SCATTER_OP_WRITE_TO_MEM(uint32_t); |
| 159 | } else { |
| 160 | g_assert_not_reached(); |
| 161 | } |
| 162 | } else { |
Brian Cain | 20c34a9 | 2023-10-08 15:09:44 -0700 | [diff] [blame] | 163 | for (int i = 0; i < sizeof(MMVector); i++) { |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 164 | if (test_bit(i, env->vtcm_log.mask)) { |
| 165 | cpu_stb_data_ra(env, env->vtcm_log.va[i], |
| 166 | env->vtcm_log.data.ub[i], ra); |
| 167 | clear_bit(i, env->vtcm_log.mask); |
| 168 | env->vtcm_log.data.ub[i] = 0; |
| 169 | } |
| 170 | |
| 171 | } |
| 172 | } |
| 173 | } |
| 174 | } |
| 175 | |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 176 | static void print_store(CPUHexagonState *env, int slot) |
| 177 | { |
| 178 | if (!(env->slot_cancelled & (1 << slot))) { |
| 179 | uint8_t width = env->mem_log_stores[slot].width; |
| 180 | if (width == 1) { |
| 181 | uint32_t data = env->mem_log_stores[slot].data32 & 0xff; |
| 182 | HEX_DEBUG_LOG("\tmemb[0x" TARGET_FMT_lx "] = %" PRId32 |
| 183 | " (0x%02" PRIx32 ")\n", |
| 184 | env->mem_log_stores[slot].va, data, data); |
| 185 | } else if (width == 2) { |
| 186 | uint32_t data = env->mem_log_stores[slot].data32 & 0xffff; |
| 187 | HEX_DEBUG_LOG("\tmemh[0x" TARGET_FMT_lx "] = %" PRId32 |
| 188 | " (0x%04" PRIx32 ")\n", |
| 189 | env->mem_log_stores[slot].va, data, data); |
| 190 | } else if (width == 4) { |
| 191 | uint32_t data = env->mem_log_stores[slot].data32; |
| 192 | HEX_DEBUG_LOG("\tmemw[0x" TARGET_FMT_lx "] = %" PRId32 |
| 193 | " (0x%08" PRIx32 ")\n", |
| 194 | env->mem_log_stores[slot].va, data, data); |
| 195 | } else if (width == 8) { |
| 196 | HEX_DEBUG_LOG("\tmemd[0x" TARGET_FMT_lx "] = %" PRId64 |
| 197 | " (0x%016" PRIx64 ")\n", |
| 198 | env->mem_log_stores[slot].va, |
| 199 | env->mem_log_stores[slot].data64, |
| 200 | env->mem_log_stores[slot].data64); |
| 201 | } else { |
| 202 | HEX_DEBUG_LOG("\tBad store width %d\n", width); |
| 203 | g_assert_not_reached(); |
| 204 | } |
| 205 | } |
| 206 | } |
| 207 | |
| 208 | /* This function is a handy place to set a breakpoint */ |
Taylor Simpson | 0fc56c4 | 2023-04-27 16:00:12 -0700 | [diff] [blame] | 209 | void HELPER(debug_commit_end)(CPUHexagonState *env, uint32_t this_PC, |
Taylor Simpson | 842b206 | 2023-04-27 16:00:10 -0700 | [diff] [blame] | 210 | int pred_written, int has_st0, int has_st1) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 211 | { |
| 212 | bool reg_printed = false; |
| 213 | bool pred_printed = false; |
| 214 | int i; |
| 215 | |
Taylor Simpson | 0fc56c4 | 2023-04-27 16:00:12 -0700 | [diff] [blame] | 216 | HEX_DEBUG_LOG("Packet committed: pc = 0x" TARGET_FMT_lx "\n", this_PC); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 217 | HEX_DEBUG_LOG("slot_cancelled = %d\n", env->slot_cancelled); |
| 218 | |
| 219 | for (i = 0; i < TOTAL_PER_THREAD_REGS; i++) { |
| 220 | if (env->reg_written[i]) { |
| 221 | if (!reg_printed) { |
| 222 | HEX_DEBUG_LOG("Regs written\n"); |
| 223 | reg_printed = true; |
| 224 | } |
| 225 | HEX_DEBUG_LOG("\tr%d = " TARGET_FMT_ld " (0x" TARGET_FMT_lx ")\n", |
Taylor Simpson | d54c561 | 2023-04-27 16:00:02 -0700 | [diff] [blame] | 226 | i, env->gpr[i], env->gpr[i]); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 227 | } |
| 228 | } |
| 229 | |
| 230 | for (i = 0; i < NUM_PREGS; i++) { |
Taylor Simpson | 842b206 | 2023-04-27 16:00:10 -0700 | [diff] [blame] | 231 | if (pred_written & (1 << i)) { |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 232 | if (!pred_printed) { |
| 233 | HEX_DEBUG_LOG("Predicates written\n"); |
| 234 | pred_printed = true; |
| 235 | } |
| 236 | HEX_DEBUG_LOG("\tp%d = 0x" TARGET_FMT_lx "\n", |
Taylor Simpson | e22edc7 | 2023-04-27 16:00:09 -0700 | [diff] [blame] | 237 | i, env->pred[i]); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 238 | } |
| 239 | } |
| 240 | |
| 241 | if (has_st0 || has_st1) { |
| 242 | HEX_DEBUG_LOG("Stores\n"); |
| 243 | if (has_st0) { |
| 244 | print_store(env, 0); |
| 245 | } |
| 246 | if (has_st1) { |
| 247 | print_store(env, 1); |
| 248 | } |
| 249 | } |
| 250 | |
Taylor Simpson | 613653e | 2022-11-08 08:29:01 -0800 | [diff] [blame] | 251 | HEX_DEBUG_LOG("Next PC = " TARGET_FMT_lx "\n", env->gpr[HEX_REG_PC]); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 252 | HEX_DEBUG_LOG("Exec counters: pkt = " TARGET_FMT_lx |
| 253 | ", insn = " TARGET_FMT_lx |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 254 | ", hvx = " TARGET_FMT_lx "\n", |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 255 | env->gpr[HEX_REG_QEMU_PKT_CNT], |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 256 | env->gpr[HEX_REG_QEMU_INSN_CNT], |
| 257 | env->gpr[HEX_REG_QEMU_HVX_CNT]); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 258 | |
| 259 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 260 | |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 261 | int32_t HELPER(fcircadd)(int32_t RxV, int32_t offset, int32_t M, int32_t CS) |
| 262 | { |
Michael Lambert | 58ff298 | 2022-02-09 18:15:45 -0800 | [diff] [blame] | 263 | uint32_t K_const = extract32(M, 24, 4); |
| 264 | uint32_t length = extract32(M, 0, 17); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 265 | uint32_t new_ptr = RxV + offset; |
Taylor Simpson | 46ef47e | 2021-04-08 20:07:50 -0500 | [diff] [blame] | 266 | uint32_t start_addr; |
| 267 | uint32_t end_addr; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 268 | |
| 269 | if (K_const == 0 && length >= 4) { |
Taylor Simpson | 46ef47e | 2021-04-08 20:07:50 -0500 | [diff] [blame] | 270 | start_addr = CS; |
| 271 | end_addr = start_addr + length; |
| 272 | } else { |
| 273 | /* |
| 274 | * Versions v3 and earlier used the K value to specify a power-of-2 size |
| 275 | * 2^(K+2) that is greater than the buffer length |
| 276 | */ |
| 277 | int32_t mask = (1 << (K_const + 2)) - 1; |
| 278 | start_addr = RxV & (~mask); |
| 279 | end_addr = start_addr | length; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 280 | } |
| 281 | |
| 282 | if (new_ptr >= end_addr) { |
| 283 | new_ptr -= length; |
| 284 | } else if (new_ptr < start_addr) { |
| 285 | new_ptr += length; |
| 286 | } |
| 287 | |
| 288 | return new_ptr; |
| 289 | } |
| 290 | |
Taylor Simpson | af7f182 | 2021-04-08 20:07:51 -0500 | [diff] [blame] | 291 | uint32_t HELPER(fbrev)(uint32_t addr) |
| 292 | { |
| 293 | /* |
| 294 | * Bit reverse the low 16 bits of the address |
| 295 | */ |
| 296 | return deposit32(addr, 0, 16, revbit16(addr)); |
| 297 | } |
| 298 | |
Taylor Simpson | d934c16 | 2021-04-08 20:07:45 -0500 | [diff] [blame] | 299 | static float32 build_float32(uint8_t sign, uint32_t exp, uint32_t mant) |
| 300 | { |
| 301 | return make_float32( |
| 302 | ((sign & 1) << 31) | |
| 303 | ((exp & 0xff) << SF_MANTBITS) | |
| 304 | (mant & ((1 << SF_MANTBITS) - 1))); |
| 305 | } |
| 306 | |
| 307 | /* |
| 308 | * sfrecipa, sfinvsqrta have two 32-bit results |
| 309 | * r0,p0=sfrecipa(r1,r2) |
| 310 | * r0,p0=sfinvsqrta(r1) |
| 311 | * |
| 312 | * Since helpers can only return a single value, we pack the two results |
| 313 | * into a 64-bit value. |
| 314 | */ |
| 315 | uint64_t HELPER(sfrecipa)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 316 | { |
| 317 | int32_t PeV = 0; |
| 318 | float32 RdV; |
| 319 | int idx; |
| 320 | int adjust; |
| 321 | int mant; |
| 322 | int exp; |
| 323 | |
| 324 | arch_fpop_start(env); |
| 325 | if (arch_sf_recip_common(&RsV, &RtV, &RdV, &adjust, &env->fp_status)) { |
| 326 | PeV = adjust; |
| 327 | idx = (RtV >> 16) & 0x7f; |
| 328 | mant = (recip_lookup_table[idx] << 15) | 1; |
| 329 | exp = SF_BIAS - (float32_getexp(RtV) - SF_BIAS) - 1; |
| 330 | RdV = build_float32(extract32(RtV, 31, 1), exp, mant); |
| 331 | } |
| 332 | arch_fpop_end(env); |
| 333 | return ((uint64_t)RdV << 32) | PeV; |
| 334 | } |
| 335 | |
Taylor Simpson | dd8705b | 2021-04-08 20:07:46 -0500 | [diff] [blame] | 336 | uint64_t HELPER(sfinvsqrta)(CPUHexagonState *env, float32 RsV) |
| 337 | { |
| 338 | int PeV = 0; |
| 339 | float32 RdV; |
| 340 | int idx; |
| 341 | int adjust; |
| 342 | int mant; |
| 343 | int exp; |
| 344 | |
| 345 | arch_fpop_start(env); |
| 346 | if (arch_sf_invsqrt_common(&RsV, &RdV, &adjust, &env->fp_status)) { |
| 347 | PeV = adjust; |
| 348 | idx = (RsV >> 17) & 0x7f; |
| 349 | mant = (invsqrt_lookup_table[idx] << 15); |
| 350 | exp = SF_BIAS - ((float32_getexp(RsV) - SF_BIAS) >> 1) - 1; |
| 351 | RdV = build_float32(extract32(RsV, 31, 1), exp, mant); |
| 352 | } |
| 353 | arch_fpop_end(env); |
| 354 | return ((uint64_t)RdV << 32) | PeV; |
| 355 | } |
| 356 | |
Taylor Simpson | da74cd2 | 2021-04-08 20:07:47 -0500 | [diff] [blame] | 357 | int64_t HELPER(vacsh_val)(CPUHexagonState *env, |
Taylor Simpson | d54c561 | 2023-04-27 16:00:02 -0700 | [diff] [blame] | 358 | int64_t RxxV, int64_t RssV, int64_t RttV, |
| 359 | uint32_t pkt_need_commit) |
Taylor Simpson | da74cd2 | 2021-04-08 20:07:47 -0500 | [diff] [blame] | 360 | { |
| 361 | for (int i = 0; i < 4; i++) { |
| 362 | int xv = sextract64(RxxV, i * 16, 16); |
| 363 | int sv = sextract64(RssV, i * 16, 16); |
| 364 | int tv = sextract64(RttV, i * 16, 16); |
| 365 | int max; |
| 366 | xv = xv + tv; |
| 367 | sv = sv - tv; |
| 368 | max = xv > sv ? xv : sv; |
| 369 | /* Note that fSATH can set the OVF bit in usr */ |
| 370 | RxxV = deposit64(RxxV, i * 16, 16, fSATH(max)); |
| 371 | } |
| 372 | return RxxV; |
| 373 | } |
| 374 | |
| 375 | int32_t HELPER(vacsh_pred)(CPUHexagonState *env, |
| 376 | int64_t RxxV, int64_t RssV, int64_t RttV) |
| 377 | { |
| 378 | int32_t PeV = 0; |
| 379 | for (int i = 0; i < 4; i++) { |
| 380 | int xv = sextract64(RxxV, i * 16, 16); |
| 381 | int sv = sextract64(RssV, i * 16, 16); |
| 382 | int tv = sextract64(RttV, i * 16, 16); |
| 383 | xv = xv + tv; |
| 384 | sv = sv - tv; |
| 385 | PeV = deposit32(PeV, i * 2, 1, (xv > sv)); |
| 386 | PeV = deposit32(PeV, i * 2 + 1, 1, (xv > sv)); |
| 387 | } |
| 388 | return PeV; |
| 389 | } |
| 390 | |
Taylor Simpson | d24f0b2 | 2023-04-27 15:59:58 -0700 | [diff] [blame] | 391 | int64_t HELPER(cabacdecbin_val)(int64_t RssV, int64_t RttV) |
| 392 | { |
| 393 | int64_t RddV = 0; |
| 394 | size4u_t state; |
| 395 | size4u_t valMPS; |
| 396 | size4u_t bitpos; |
| 397 | size4u_t range; |
| 398 | size4u_t offset; |
| 399 | size4u_t rLPS; |
| 400 | size4u_t rMPS; |
| 401 | |
| 402 | state = fEXTRACTU_RANGE(fGETWORD(1, RttV), 5, 0); |
| 403 | valMPS = fEXTRACTU_RANGE(fGETWORD(1, RttV), 8, 8); |
| 404 | bitpos = fEXTRACTU_RANGE(fGETWORD(0, RttV), 4, 0); |
| 405 | range = fGETWORD(0, RssV); |
| 406 | offset = fGETWORD(1, RssV); |
| 407 | |
| 408 | /* calculate rLPS */ |
| 409 | range <<= bitpos; |
| 410 | offset <<= bitpos; |
| 411 | rLPS = rLPS_table_64x4[state][(range >> 29) & 3]; |
| 412 | rLPS = rLPS << 23; /* left aligned */ |
| 413 | |
| 414 | /* calculate rMPS */ |
| 415 | rMPS = (range & 0xff800000) - rLPS; |
| 416 | |
| 417 | /* most probable region */ |
| 418 | if (offset < rMPS) { |
| 419 | RddV = AC_next_state_MPS_64[state]; |
| 420 | fINSERT_RANGE(RddV, 8, 8, valMPS); |
| 421 | fINSERT_RANGE(RddV, 31, 23, (rMPS >> 23)); |
| 422 | fSETWORD(1, RddV, offset); |
| 423 | } |
| 424 | /* least probable region */ |
| 425 | else { |
| 426 | RddV = AC_next_state_LPS_64[state]; |
| 427 | fINSERT_RANGE(RddV, 8, 8, ((!state) ? (1 - valMPS) : (valMPS))); |
| 428 | fINSERT_RANGE(RddV, 31, 23, (rLPS >> 23)); |
| 429 | fSETWORD(1, RddV, (offset - rMPS)); |
| 430 | } |
| 431 | return RddV; |
| 432 | } |
| 433 | |
| 434 | int32_t HELPER(cabacdecbin_pred)(int64_t RssV, int64_t RttV) |
| 435 | { |
| 436 | int32_t p0 = 0; |
| 437 | size4u_t state; |
| 438 | size4u_t valMPS; |
| 439 | size4u_t bitpos; |
| 440 | size4u_t range; |
| 441 | size4u_t offset; |
| 442 | size4u_t rLPS; |
| 443 | size4u_t rMPS; |
| 444 | |
| 445 | state = fEXTRACTU_RANGE(fGETWORD(1, RttV), 5, 0); |
| 446 | valMPS = fEXTRACTU_RANGE(fGETWORD(1, RttV), 8, 8); |
| 447 | bitpos = fEXTRACTU_RANGE(fGETWORD(0, RttV), 4, 0); |
| 448 | range = fGETWORD(0, RssV); |
| 449 | offset = fGETWORD(1, RssV); |
| 450 | |
| 451 | /* calculate rLPS */ |
| 452 | range <<= bitpos; |
| 453 | offset <<= bitpos; |
| 454 | rLPS = rLPS_table_64x4[state][(range >> 29) & 3]; |
| 455 | rLPS = rLPS << 23; /* left aligned */ |
| 456 | |
| 457 | /* calculate rMPS */ |
| 458 | rMPS = (range & 0xff800000) - rLPS; |
| 459 | |
| 460 | /* most probable region */ |
| 461 | if (offset < rMPS) { |
| 462 | p0 = valMPS; |
| 463 | |
| 464 | } |
| 465 | /* least probable region */ |
| 466 | else { |
| 467 | p0 = valMPS ^ 1; |
| 468 | } |
| 469 | return p0; |
| 470 | } |
| 471 | |
Taylor Simpson | 7b84fd0 | 2023-03-06 18:58:27 -0800 | [diff] [blame] | 472 | static void probe_store(CPUHexagonState *env, int slot, int mmu_idx, |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 473 | bool is_predicated, uintptr_t retaddr) |
Taylor Simpson | c23b576 | 2021-09-22 10:30:46 -0500 | [diff] [blame] | 474 | { |
Taylor Simpson | 7b84fd0 | 2023-03-06 18:58:27 -0800 | [diff] [blame] | 475 | if (!is_predicated || !(env->slot_cancelled & (1 << slot))) { |
Taylor Simpson | c23b576 | 2021-09-22 10:30:46 -0500 | [diff] [blame] | 476 | size1u_t width = env->mem_log_stores[slot].width; |
| 477 | target_ulong va = env->mem_log_stores[slot].va; |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 478 | probe_write(env, va, width, mmu_idx, retaddr); |
Taylor Simpson | c23b576 | 2021-09-22 10:30:46 -0500 | [diff] [blame] | 479 | } |
| 480 | } |
| 481 | |
Taylor Simpson | 15fc6ba | 2022-07-07 14:05:46 -0700 | [diff] [blame] | 482 | /* |
| 483 | * Called from a mem_noshuf packet to make sure the load doesn't |
| 484 | * raise an exception |
| 485 | */ |
| 486 | void HELPER(probe_noshuf_load)(CPUHexagonState *env, target_ulong va, |
| 487 | int size, int mmu_idx) |
| 488 | { |
| 489 | uintptr_t retaddr = GETPC(); |
| 490 | probe_read(env, va, size, mmu_idx, retaddr); |
| 491 | } |
| 492 | |
Taylor Simpson | c23b576 | 2021-09-22 10:30:46 -0500 | [diff] [blame] | 493 | /* Called during packet commit when there are two scalar stores */ |
Taylor Simpson | 7b84fd0 | 2023-03-06 18:58:27 -0800 | [diff] [blame] | 494 | void HELPER(probe_pkt_scalar_store_s0)(CPUHexagonState *env, int args) |
Taylor Simpson | c23b576 | 2021-09-22 10:30:46 -0500 | [diff] [blame] | 495 | { |
Taylor Simpson | 7b84fd0 | 2023-03-06 18:58:27 -0800 | [diff] [blame] | 496 | int mmu_idx = FIELD_EX32(args, PROBE_PKT_SCALAR_STORE_S0, MMU_IDX); |
| 497 | bool is_predicated = |
| 498 | FIELD_EX32(args, PROBE_PKT_SCALAR_STORE_S0, IS_PREDICATED); |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 499 | uintptr_t ra = GETPC(); |
| 500 | probe_store(env, 0, mmu_idx, is_predicated, ra); |
Taylor Simpson | c23b576 | 2021-09-22 10:30:46 -0500 | [diff] [blame] | 501 | } |
| 502 | |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 503 | static void probe_hvx_stores(CPUHexagonState *env, int mmu_idx, |
| 504 | uintptr_t retaddr) |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 505 | { |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 506 | /* Normal (possibly masked) vector store */ |
Brian Cain | 20c34a9 | 2023-10-08 15:09:44 -0700 | [diff] [blame] | 507 | for (int i = 0; i < VSTORES_MAX; i++) { |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 508 | if (env->vstore_pending[i]) { |
| 509 | target_ulong va = env->vstore[i].va; |
| 510 | int size = env->vstore[i].size; |
| 511 | for (int j = 0; j < size; j++) { |
| 512 | if (test_bit(j, env->vstore[i].mask)) { |
| 513 | probe_write(env, va + j, 1, mmu_idx, retaddr); |
| 514 | } |
| 515 | } |
| 516 | } |
| 517 | } |
| 518 | |
| 519 | /* Scatter store */ |
| 520 | if (env->vtcm_pending) { |
| 521 | if (env->vtcm_log.op) { |
| 522 | /* Need to perform the scatter read/modify/write at commit time */ |
| 523 | if (env->vtcm_log.op_size == 2) { |
| 524 | SCATTER_OP_PROBE_MEM(size2u_t, mmu_idx, retaddr); |
| 525 | } else if (env->vtcm_log.op_size == 4) { |
| 526 | /* Word Scatter += */ |
| 527 | SCATTER_OP_PROBE_MEM(size4u_t, mmu_idx, retaddr); |
| 528 | } else { |
| 529 | g_assert_not_reached(); |
| 530 | } |
| 531 | } else { |
| 532 | for (int i = 0; i < sizeof(MMVector); i++) { |
| 533 | if (test_bit(i, env->vtcm_log.mask)) { |
| 534 | probe_write(env, env->vtcm_log.va[i], 1, mmu_idx, retaddr); |
| 535 | } |
| 536 | |
| 537 | } |
| 538 | } |
| 539 | } |
| 540 | } |
| 541 | |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 542 | void HELPER(probe_hvx_stores)(CPUHexagonState *env, int mmu_idx) |
| 543 | { |
| 544 | uintptr_t retaddr = GETPC(); |
| 545 | probe_hvx_stores(env, mmu_idx, retaddr); |
| 546 | } |
| 547 | |
Taylor Simpson | 2bda44e | 2023-04-05 09:42:10 -0700 | [diff] [blame] | 548 | void HELPER(probe_pkt_scalar_hvx_stores)(CPUHexagonState *env, int mask) |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 549 | { |
Taylor Simpson | 7b84fd0 | 2023-03-06 18:58:27 -0800 | [diff] [blame] | 550 | bool has_st0 = FIELD_EX32(mask, PROBE_PKT_SCALAR_HVX_STORES, HAS_ST0); |
| 551 | bool has_st1 = FIELD_EX32(mask, PROBE_PKT_SCALAR_HVX_STORES, HAS_ST1); |
| 552 | bool has_hvx_stores = |
| 553 | FIELD_EX32(mask, PROBE_PKT_SCALAR_HVX_STORES, HAS_HVX_STORES); |
| 554 | bool s0_is_pred = FIELD_EX32(mask, PROBE_PKT_SCALAR_HVX_STORES, S0_IS_PRED); |
| 555 | bool s1_is_pred = FIELD_EX32(mask, PROBE_PKT_SCALAR_HVX_STORES, S1_IS_PRED); |
Taylor Simpson | 2bda44e | 2023-04-05 09:42:10 -0700 | [diff] [blame] | 556 | int mmu_idx = FIELD_EX32(mask, PROBE_PKT_SCALAR_HVX_STORES, MMU_IDX); |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 557 | uintptr_t ra = GETPC(); |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 558 | |
| 559 | if (has_st0) { |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 560 | probe_store(env, 0, mmu_idx, s0_is_pred, ra); |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 561 | } |
| 562 | if (has_st1) { |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 563 | probe_store(env, 1, mmu_idx, s1_is_pred, ra); |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 564 | } |
| 565 | if (has_hvx_stores) { |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 566 | probe_hvx_stores(env, mmu_idx, ra); |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 567 | } |
| 568 | } |
| 569 | |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 570 | #ifndef CONFIG_HEXAGON_IDEF_PARSER |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 571 | /* |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 572 | * mem_noshuf |
| 573 | * Section 5.5 of the Hexagon V67 Programmer's Reference Manual |
| 574 | * |
| 575 | * If the load is in slot 0 and there is a store in slot1 (that |
| 576 | * wasn't cancelled), we have to do the store first. |
| 577 | */ |
Taylor Simpson | e5d0d78 | 2023-04-27 16:00:11 -0700 | [diff] [blame] | 578 | static void check_noshuf(CPUHexagonState *env, bool pkt_has_store_s1, |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 579 | uint32_t slot, target_ulong vaddr, int size, |
| 580 | uintptr_t ra) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 581 | { |
Taylor Simpson | e5d0d78 | 2023-04-27 16:00:11 -0700 | [diff] [blame] | 582 | if (slot == 0 && pkt_has_store_s1 && |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 583 | ((env->slot_cancelled & (1 << 1)) == 0)) { |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 584 | probe_read(env, vaddr, size, MMU_USER_IDX, ra); |
| 585 | commit_store(env, 1, ra); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 586 | } |
| 587 | } |
Matheus Tavares Bernardino | 3bd8359 | 2023-10-08 15:09:43 -0700 | [diff] [blame] | 588 | #endif |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 589 | |
| 590 | /* Floating point */ |
| 591 | float64 HELPER(conv_sf2df)(CPUHexagonState *env, float32 RsV) |
| 592 | { |
| 593 | float64 out_f64; |
| 594 | arch_fpop_start(env); |
| 595 | out_f64 = float32_to_float64(RsV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 596 | arch_fpop_end(env); |
| 597 | return out_f64; |
| 598 | } |
| 599 | |
| 600 | float32 HELPER(conv_df2sf)(CPUHexagonState *env, float64 RssV) |
| 601 | { |
| 602 | float32 out_f32; |
| 603 | arch_fpop_start(env); |
| 604 | out_f32 = float64_to_float32(RssV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 605 | arch_fpop_end(env); |
| 606 | return out_f32; |
| 607 | } |
| 608 | |
| 609 | float32 HELPER(conv_uw2sf)(CPUHexagonState *env, int32_t RsV) |
| 610 | { |
| 611 | float32 RdV; |
| 612 | arch_fpop_start(env); |
| 613 | RdV = uint32_to_float32(RsV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 614 | arch_fpop_end(env); |
| 615 | return RdV; |
| 616 | } |
| 617 | |
| 618 | float64 HELPER(conv_uw2df)(CPUHexagonState *env, int32_t RsV) |
| 619 | { |
| 620 | float64 RddV; |
| 621 | arch_fpop_start(env); |
| 622 | RddV = uint32_to_float64(RsV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 623 | arch_fpop_end(env); |
| 624 | return RddV; |
| 625 | } |
| 626 | |
| 627 | float32 HELPER(conv_w2sf)(CPUHexagonState *env, int32_t RsV) |
| 628 | { |
| 629 | float32 RdV; |
| 630 | arch_fpop_start(env); |
| 631 | RdV = int32_to_float32(RsV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 632 | arch_fpop_end(env); |
| 633 | return RdV; |
| 634 | } |
| 635 | |
| 636 | float64 HELPER(conv_w2df)(CPUHexagonState *env, int32_t RsV) |
| 637 | { |
| 638 | float64 RddV; |
| 639 | arch_fpop_start(env); |
| 640 | RddV = int32_to_float64(RsV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 641 | arch_fpop_end(env); |
| 642 | return RddV; |
| 643 | } |
| 644 | |
| 645 | float32 HELPER(conv_ud2sf)(CPUHexagonState *env, int64_t RssV) |
| 646 | { |
| 647 | float32 RdV; |
| 648 | arch_fpop_start(env); |
| 649 | RdV = uint64_to_float32(RssV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 650 | arch_fpop_end(env); |
| 651 | return RdV; |
| 652 | } |
| 653 | |
| 654 | float64 HELPER(conv_ud2df)(CPUHexagonState *env, int64_t RssV) |
| 655 | { |
| 656 | float64 RddV; |
| 657 | arch_fpop_start(env); |
| 658 | RddV = uint64_to_float64(RssV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 659 | arch_fpop_end(env); |
| 660 | return RddV; |
| 661 | } |
| 662 | |
| 663 | float32 HELPER(conv_d2sf)(CPUHexagonState *env, int64_t RssV) |
| 664 | { |
| 665 | float32 RdV; |
| 666 | arch_fpop_start(env); |
| 667 | RdV = int64_to_float32(RssV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 668 | arch_fpop_end(env); |
| 669 | return RdV; |
| 670 | } |
| 671 | |
| 672 | float64 HELPER(conv_d2df)(CPUHexagonState *env, int64_t RssV) |
| 673 | { |
| 674 | float64 RddV; |
| 675 | arch_fpop_start(env); |
| 676 | RddV = int64_to_float64(RssV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 677 | arch_fpop_end(env); |
| 678 | return RddV; |
| 679 | } |
| 680 | |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 681 | uint32_t HELPER(conv_sf2uw)(CPUHexagonState *env, float32 RsV) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 682 | { |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 683 | uint32_t RdV; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 684 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 685 | /* Hexagon checks the sign before rounding */ |
| 686 | if (float32_is_neg(RsV) && !float32_is_any_nan(RsV)) { |
| 687 | float_raise(float_flag_invalid, &env->fp_status); |
| 688 | RdV = 0; |
| 689 | } else { |
| 690 | RdV = float32_to_uint32(RsV, &env->fp_status); |
| 691 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 692 | arch_fpop_end(env); |
| 693 | return RdV; |
| 694 | } |
| 695 | |
| 696 | int32_t HELPER(conv_sf2w)(CPUHexagonState *env, float32 RsV) |
| 697 | { |
| 698 | int32_t RdV; |
| 699 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 700 | /* Hexagon returns -1 for NaN */ |
| 701 | if (float32_is_any_nan(RsV)) { |
| 702 | float_raise(float_flag_invalid, &env->fp_status); |
| 703 | RdV = -1; |
| 704 | } else { |
| 705 | RdV = float32_to_int32(RsV, &env->fp_status); |
| 706 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 707 | arch_fpop_end(env); |
| 708 | return RdV; |
| 709 | } |
| 710 | |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 711 | uint64_t HELPER(conv_sf2ud)(CPUHexagonState *env, float32 RsV) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 712 | { |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 713 | uint64_t RddV; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 714 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 715 | /* Hexagon checks the sign before rounding */ |
| 716 | if (float32_is_neg(RsV) && !float32_is_any_nan(RsV)) { |
| 717 | float_raise(float_flag_invalid, &env->fp_status); |
| 718 | RddV = 0; |
| 719 | } else { |
| 720 | RddV = float32_to_uint64(RsV, &env->fp_status); |
| 721 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 722 | arch_fpop_end(env); |
| 723 | return RddV; |
| 724 | } |
| 725 | |
| 726 | int64_t HELPER(conv_sf2d)(CPUHexagonState *env, float32 RsV) |
| 727 | { |
| 728 | int64_t RddV; |
| 729 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 730 | /* Hexagon returns -1 for NaN */ |
| 731 | if (float32_is_any_nan(RsV)) { |
| 732 | float_raise(float_flag_invalid, &env->fp_status); |
| 733 | RddV = -1; |
| 734 | } else { |
| 735 | RddV = float32_to_int64(RsV, &env->fp_status); |
| 736 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 737 | arch_fpop_end(env); |
| 738 | return RddV; |
| 739 | } |
| 740 | |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 741 | uint32_t HELPER(conv_df2uw)(CPUHexagonState *env, float64 RssV) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 742 | { |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 743 | uint32_t RdV; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 744 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 745 | /* Hexagon checks the sign before rounding */ |
| 746 | if (float64_is_neg(RssV) && !float64_is_any_nan(RssV)) { |
| 747 | float_raise(float_flag_invalid, &env->fp_status); |
| 748 | RdV = 0; |
| 749 | } else { |
| 750 | RdV = float64_to_uint32(RssV, &env->fp_status); |
| 751 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 752 | arch_fpop_end(env); |
| 753 | return RdV; |
| 754 | } |
| 755 | |
| 756 | int32_t HELPER(conv_df2w)(CPUHexagonState *env, float64 RssV) |
| 757 | { |
| 758 | int32_t RdV; |
| 759 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 760 | /* Hexagon returns -1 for NaN */ |
| 761 | if (float64_is_any_nan(RssV)) { |
| 762 | float_raise(float_flag_invalid, &env->fp_status); |
| 763 | RdV = -1; |
| 764 | } else { |
| 765 | RdV = float64_to_int32(RssV, &env->fp_status); |
| 766 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 767 | arch_fpop_end(env); |
| 768 | return RdV; |
| 769 | } |
| 770 | |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 771 | uint64_t HELPER(conv_df2ud)(CPUHexagonState *env, float64 RssV) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 772 | { |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 773 | uint64_t RddV; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 774 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 775 | /* Hexagon checks the sign before rounding */ |
| 776 | if (float64_is_neg(RssV) && !float64_is_any_nan(RssV)) { |
| 777 | float_raise(float_flag_invalid, &env->fp_status); |
| 778 | RddV = 0; |
| 779 | } else { |
| 780 | RddV = float64_to_uint64(RssV, &env->fp_status); |
| 781 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 782 | arch_fpop_end(env); |
| 783 | return RddV; |
| 784 | } |
| 785 | |
| 786 | int64_t HELPER(conv_df2d)(CPUHexagonState *env, float64 RssV) |
| 787 | { |
| 788 | int64_t RddV; |
| 789 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 790 | /* Hexagon returns -1 for NaN */ |
| 791 | if (float64_is_any_nan(RssV)) { |
| 792 | float_raise(float_flag_invalid, &env->fp_status); |
| 793 | RddV = -1; |
| 794 | } else { |
| 795 | RddV = float64_to_int64(RssV, &env->fp_status); |
| 796 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 797 | arch_fpop_end(env); |
| 798 | return RddV; |
| 799 | } |
| 800 | |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 801 | uint32_t HELPER(conv_sf2uw_chop)(CPUHexagonState *env, float32 RsV) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 802 | { |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 803 | uint32_t RdV; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 804 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 805 | /* Hexagon checks the sign before rounding */ |
| 806 | if (float32_is_neg(RsV) && !float32_is_any_nan(RsV)) { |
| 807 | float_raise(float_flag_invalid, &env->fp_status); |
| 808 | RdV = 0; |
| 809 | } else { |
| 810 | RdV = float32_to_uint32_round_to_zero(RsV, &env->fp_status); |
| 811 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 812 | arch_fpop_end(env); |
| 813 | return RdV; |
| 814 | } |
| 815 | |
| 816 | int32_t HELPER(conv_sf2w_chop)(CPUHexagonState *env, float32 RsV) |
| 817 | { |
| 818 | int32_t RdV; |
| 819 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 820 | /* Hexagon returns -1 for NaN */ |
| 821 | if (float32_is_any_nan(RsV)) { |
| 822 | float_raise(float_flag_invalid, &env->fp_status); |
| 823 | RdV = -1; |
| 824 | } else { |
| 825 | RdV = float32_to_int32_round_to_zero(RsV, &env->fp_status); |
| 826 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 827 | arch_fpop_end(env); |
| 828 | return RdV; |
| 829 | } |
| 830 | |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 831 | uint64_t HELPER(conv_sf2ud_chop)(CPUHexagonState *env, float32 RsV) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 832 | { |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 833 | uint64_t RddV; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 834 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 835 | /* Hexagon checks the sign before rounding */ |
| 836 | if (float32_is_neg(RsV) && !float32_is_any_nan(RsV)) { |
| 837 | float_raise(float_flag_invalid, &env->fp_status); |
| 838 | RddV = 0; |
| 839 | } else { |
| 840 | RddV = float32_to_uint64_round_to_zero(RsV, &env->fp_status); |
| 841 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 842 | arch_fpop_end(env); |
| 843 | return RddV; |
| 844 | } |
| 845 | |
| 846 | int64_t HELPER(conv_sf2d_chop)(CPUHexagonState *env, float32 RsV) |
| 847 | { |
| 848 | int64_t RddV; |
| 849 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 850 | /* Hexagon returns -1 for NaN */ |
| 851 | if (float32_is_any_nan(RsV)) { |
| 852 | float_raise(float_flag_invalid, &env->fp_status); |
| 853 | RddV = -1; |
| 854 | } else { |
| 855 | RddV = float32_to_int64_round_to_zero(RsV, &env->fp_status); |
| 856 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 857 | arch_fpop_end(env); |
| 858 | return RddV; |
| 859 | } |
| 860 | |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 861 | uint32_t HELPER(conv_df2uw_chop)(CPUHexagonState *env, float64 RssV) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 862 | { |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 863 | uint32_t RdV; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 864 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 865 | /* Hexagon checks the sign before rounding */ |
Taylor Simpson | 3977ba3 | 2022-02-09 18:15:54 -0800 | [diff] [blame] | 866 | if (float64_is_neg(RssV) && !float64_is_any_nan(RssV)) { |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 867 | float_raise(float_flag_invalid, &env->fp_status); |
| 868 | RdV = 0; |
| 869 | } else { |
| 870 | RdV = float64_to_uint32_round_to_zero(RssV, &env->fp_status); |
| 871 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 872 | arch_fpop_end(env); |
| 873 | return RdV; |
| 874 | } |
| 875 | |
| 876 | int32_t HELPER(conv_df2w_chop)(CPUHexagonState *env, float64 RssV) |
| 877 | { |
| 878 | int32_t RdV; |
| 879 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 880 | /* Hexagon returns -1 for NaN */ |
| 881 | if (float64_is_any_nan(RssV)) { |
| 882 | float_raise(float_flag_invalid, &env->fp_status); |
| 883 | RdV = -1; |
| 884 | } else { |
| 885 | RdV = float64_to_int32_round_to_zero(RssV, &env->fp_status); |
| 886 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 887 | arch_fpop_end(env); |
| 888 | return RdV; |
| 889 | } |
| 890 | |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 891 | uint64_t HELPER(conv_df2ud_chop)(CPUHexagonState *env, float64 RssV) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 892 | { |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 893 | uint64_t RddV; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 894 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 895 | /* Hexagon checks the sign before rounding */ |
| 896 | if (float64_is_neg(RssV) && !float64_is_any_nan(RssV)) { |
| 897 | float_raise(float_flag_invalid, &env->fp_status); |
| 898 | RddV = 0; |
| 899 | } else { |
| 900 | RddV = float64_to_uint64_round_to_zero(RssV, &env->fp_status); |
| 901 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 902 | arch_fpop_end(env); |
| 903 | return RddV; |
| 904 | } |
| 905 | |
| 906 | int64_t HELPER(conv_df2d_chop)(CPUHexagonState *env, float64 RssV) |
| 907 | { |
| 908 | int64_t RddV; |
| 909 | arch_fpop_start(env); |
Taylor Simpson | b3f37ab | 2021-04-08 20:07:40 -0500 | [diff] [blame] | 910 | /* Hexagon returns -1 for NaN */ |
| 911 | if (float64_is_any_nan(RssV)) { |
| 912 | float_raise(float_flag_invalid, &env->fp_status); |
| 913 | RddV = -1; |
| 914 | } else { |
| 915 | RddV = float64_to_int64_round_to_zero(RssV, &env->fp_status); |
| 916 | } |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 917 | arch_fpop_end(env); |
| 918 | return RddV; |
| 919 | } |
| 920 | |
| 921 | float32 HELPER(sfadd)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 922 | { |
| 923 | float32 RdV; |
| 924 | arch_fpop_start(env); |
| 925 | RdV = float32_add(RsV, RtV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 926 | arch_fpop_end(env); |
| 927 | return RdV; |
| 928 | } |
| 929 | |
| 930 | float32 HELPER(sfsub)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 931 | { |
| 932 | float32 RdV; |
| 933 | arch_fpop_start(env); |
| 934 | RdV = float32_sub(RsV, RtV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 935 | arch_fpop_end(env); |
| 936 | return RdV; |
| 937 | } |
| 938 | |
| 939 | int32_t HELPER(sfcmpeq)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 940 | { |
| 941 | int32_t PdV; |
| 942 | arch_fpop_start(env); |
| 943 | PdV = f8BITSOF(float32_eq_quiet(RsV, RtV, &env->fp_status)); |
| 944 | arch_fpop_end(env); |
| 945 | return PdV; |
| 946 | } |
| 947 | |
| 948 | int32_t HELPER(sfcmpgt)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 949 | { |
| 950 | int cmp; |
| 951 | int32_t PdV; |
| 952 | arch_fpop_start(env); |
| 953 | cmp = float32_compare_quiet(RsV, RtV, &env->fp_status); |
| 954 | PdV = f8BITSOF(cmp == float_relation_greater); |
| 955 | arch_fpop_end(env); |
| 956 | return PdV; |
| 957 | } |
| 958 | |
| 959 | int32_t HELPER(sfcmpge)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 960 | { |
| 961 | int cmp; |
| 962 | int32_t PdV; |
| 963 | arch_fpop_start(env); |
| 964 | cmp = float32_compare_quiet(RsV, RtV, &env->fp_status); |
| 965 | PdV = f8BITSOF(cmp == float_relation_greater || |
| 966 | cmp == float_relation_equal); |
| 967 | arch_fpop_end(env); |
| 968 | return PdV; |
| 969 | } |
| 970 | |
| 971 | int32_t HELPER(sfcmpuo)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 972 | { |
| 973 | int32_t PdV; |
| 974 | arch_fpop_start(env); |
Taylor Simpson | 9a65990 | 2022-02-09 18:15:47 -0800 | [diff] [blame] | 975 | PdV = f8BITSOF(float32_unordered_quiet(RsV, RtV, &env->fp_status)); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 976 | arch_fpop_end(env); |
| 977 | return PdV; |
| 978 | } |
| 979 | |
| 980 | float32 HELPER(sfmax)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 981 | { |
| 982 | float32 RdV; |
| 983 | arch_fpop_start(env); |
Taylor Simpson | d76dd81 | 2022-02-15 20:39:39 -0800 | [diff] [blame] | 984 | RdV = float32_maximum_number(RsV, RtV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 985 | arch_fpop_end(env); |
| 986 | return RdV; |
| 987 | } |
| 988 | |
| 989 | float32 HELPER(sfmin)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 990 | { |
| 991 | float32 RdV; |
| 992 | arch_fpop_start(env); |
Taylor Simpson | d76dd81 | 2022-02-15 20:39:39 -0800 | [diff] [blame] | 993 | RdV = float32_minimum_number(RsV, RtV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 994 | arch_fpop_end(env); |
| 995 | return RdV; |
| 996 | } |
| 997 | |
| 998 | int32_t HELPER(sfclass)(CPUHexagonState *env, float32 RsV, int32_t uiV) |
| 999 | { |
| 1000 | int32_t PdV = 0; |
| 1001 | arch_fpop_start(env); |
| 1002 | if (fGETBIT(0, uiV) && float32_is_zero(RsV)) { |
| 1003 | PdV = 0xff; |
| 1004 | } |
| 1005 | if (fGETBIT(1, uiV) && float32_is_normal(RsV)) { |
| 1006 | PdV = 0xff; |
| 1007 | } |
| 1008 | if (fGETBIT(2, uiV) && float32_is_denormal(RsV)) { |
| 1009 | PdV = 0xff; |
| 1010 | } |
| 1011 | if (fGETBIT(3, uiV) && float32_is_infinity(RsV)) { |
| 1012 | PdV = 0xff; |
| 1013 | } |
| 1014 | if (fGETBIT(4, uiV) && float32_is_any_nan(RsV)) { |
| 1015 | PdV = 0xff; |
| 1016 | } |
| 1017 | set_float_exception_flags(0, &env->fp_status); |
| 1018 | arch_fpop_end(env); |
| 1019 | return PdV; |
| 1020 | } |
| 1021 | |
| 1022 | float32 HELPER(sffixupn)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 1023 | { |
| 1024 | float32 RdV = 0; |
| 1025 | int adjust; |
| 1026 | arch_fpop_start(env); |
| 1027 | arch_sf_recip_common(&RsV, &RtV, &RdV, &adjust, &env->fp_status); |
| 1028 | RdV = RsV; |
| 1029 | arch_fpop_end(env); |
| 1030 | return RdV; |
| 1031 | } |
| 1032 | |
| 1033 | float32 HELPER(sffixupd)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 1034 | { |
| 1035 | float32 RdV = 0; |
| 1036 | int adjust; |
| 1037 | arch_fpop_start(env); |
| 1038 | arch_sf_recip_common(&RsV, &RtV, &RdV, &adjust, &env->fp_status); |
| 1039 | RdV = RtV; |
| 1040 | arch_fpop_end(env); |
| 1041 | return RdV; |
| 1042 | } |
| 1043 | |
| 1044 | float32 HELPER(sffixupr)(CPUHexagonState *env, float32 RsV) |
| 1045 | { |
| 1046 | float32 RdV = 0; |
| 1047 | int adjust; |
| 1048 | arch_fpop_start(env); |
| 1049 | arch_sf_invsqrt_common(&RsV, &RdV, &adjust, &env->fp_status); |
| 1050 | RdV = RsV; |
| 1051 | arch_fpop_end(env); |
| 1052 | return RdV; |
| 1053 | } |
| 1054 | |
| 1055 | float64 HELPER(dfadd)(CPUHexagonState *env, float64 RssV, float64 RttV) |
| 1056 | { |
| 1057 | float64 RddV; |
| 1058 | arch_fpop_start(env); |
| 1059 | RddV = float64_add(RssV, RttV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1060 | arch_fpop_end(env); |
| 1061 | return RddV; |
| 1062 | } |
| 1063 | |
| 1064 | float64 HELPER(dfsub)(CPUHexagonState *env, float64 RssV, float64 RttV) |
| 1065 | { |
| 1066 | float64 RddV; |
| 1067 | arch_fpop_start(env); |
| 1068 | RddV = float64_sub(RssV, RttV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1069 | arch_fpop_end(env); |
| 1070 | return RddV; |
| 1071 | } |
| 1072 | |
| 1073 | float64 HELPER(dfmax)(CPUHexagonState *env, float64 RssV, float64 RttV) |
| 1074 | { |
| 1075 | float64 RddV; |
| 1076 | arch_fpop_start(env); |
Taylor Simpson | d76dd81 | 2022-02-15 20:39:39 -0800 | [diff] [blame] | 1077 | RddV = float64_maximum_number(RssV, RttV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1078 | arch_fpop_end(env); |
| 1079 | return RddV; |
| 1080 | } |
| 1081 | |
| 1082 | float64 HELPER(dfmin)(CPUHexagonState *env, float64 RssV, float64 RttV) |
| 1083 | { |
| 1084 | float64 RddV; |
| 1085 | arch_fpop_start(env); |
Taylor Simpson | d76dd81 | 2022-02-15 20:39:39 -0800 | [diff] [blame] | 1086 | RddV = float64_minimum_number(RssV, RttV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1087 | arch_fpop_end(env); |
| 1088 | return RddV; |
| 1089 | } |
| 1090 | |
| 1091 | int32_t HELPER(dfcmpeq)(CPUHexagonState *env, float64 RssV, float64 RttV) |
| 1092 | { |
| 1093 | int32_t PdV; |
| 1094 | arch_fpop_start(env); |
| 1095 | PdV = f8BITSOF(float64_eq_quiet(RssV, RttV, &env->fp_status)); |
| 1096 | arch_fpop_end(env); |
| 1097 | return PdV; |
| 1098 | } |
| 1099 | |
| 1100 | int32_t HELPER(dfcmpgt)(CPUHexagonState *env, float64 RssV, float64 RttV) |
| 1101 | { |
| 1102 | int cmp; |
| 1103 | int32_t PdV; |
| 1104 | arch_fpop_start(env); |
| 1105 | cmp = float64_compare_quiet(RssV, RttV, &env->fp_status); |
| 1106 | PdV = f8BITSOF(cmp == float_relation_greater); |
| 1107 | arch_fpop_end(env); |
| 1108 | return PdV; |
| 1109 | } |
| 1110 | |
| 1111 | int32_t HELPER(dfcmpge)(CPUHexagonState *env, float64 RssV, float64 RttV) |
| 1112 | { |
| 1113 | int cmp; |
| 1114 | int32_t PdV; |
| 1115 | arch_fpop_start(env); |
| 1116 | cmp = float64_compare_quiet(RssV, RttV, &env->fp_status); |
| 1117 | PdV = f8BITSOF(cmp == float_relation_greater || |
| 1118 | cmp == float_relation_equal); |
| 1119 | arch_fpop_end(env); |
| 1120 | return PdV; |
| 1121 | } |
| 1122 | |
| 1123 | int32_t HELPER(dfcmpuo)(CPUHexagonState *env, float64 RssV, float64 RttV) |
| 1124 | { |
| 1125 | int32_t PdV; |
| 1126 | arch_fpop_start(env); |
Taylor Simpson | 9a65990 | 2022-02-09 18:15:47 -0800 | [diff] [blame] | 1127 | PdV = f8BITSOF(float64_unordered_quiet(RssV, RttV, &env->fp_status)); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1128 | arch_fpop_end(env); |
| 1129 | return PdV; |
| 1130 | } |
| 1131 | |
| 1132 | int32_t HELPER(dfclass)(CPUHexagonState *env, float64 RssV, int32_t uiV) |
| 1133 | { |
| 1134 | int32_t PdV = 0; |
| 1135 | arch_fpop_start(env); |
| 1136 | if (fGETBIT(0, uiV) && float64_is_zero(RssV)) { |
| 1137 | PdV = 0xff; |
| 1138 | } |
| 1139 | if (fGETBIT(1, uiV) && float64_is_normal(RssV)) { |
| 1140 | PdV = 0xff; |
| 1141 | } |
| 1142 | if (fGETBIT(2, uiV) && float64_is_denormal(RssV)) { |
| 1143 | PdV = 0xff; |
| 1144 | } |
| 1145 | if (fGETBIT(3, uiV) && float64_is_infinity(RssV)) { |
| 1146 | PdV = 0xff; |
| 1147 | } |
| 1148 | if (fGETBIT(4, uiV) && float64_is_any_nan(RssV)) { |
| 1149 | PdV = 0xff; |
| 1150 | } |
| 1151 | set_float_exception_flags(0, &env->fp_status); |
| 1152 | arch_fpop_end(env); |
| 1153 | return PdV; |
| 1154 | } |
| 1155 | |
| 1156 | float32 HELPER(sfmpy)(CPUHexagonState *env, float32 RsV, float32 RtV) |
| 1157 | { |
| 1158 | float32 RdV; |
| 1159 | arch_fpop_start(env); |
| 1160 | RdV = internal_mpyf(RsV, RtV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1161 | arch_fpop_end(env); |
| 1162 | return RdV; |
| 1163 | } |
| 1164 | |
| 1165 | float32 HELPER(sffma)(CPUHexagonState *env, float32 RxV, |
| 1166 | float32 RsV, float32 RtV) |
| 1167 | { |
| 1168 | arch_fpop_start(env); |
| 1169 | RxV = internal_fmafx(RsV, RtV, RxV, 0, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1170 | arch_fpop_end(env); |
| 1171 | return RxV; |
| 1172 | } |
| 1173 | |
| 1174 | static bool is_zero_prod(float32 a, float32 b) |
| 1175 | { |
| 1176 | return ((float32_is_zero(a) && is_finite(b)) || |
| 1177 | (float32_is_zero(b) && is_finite(a))); |
| 1178 | } |
| 1179 | |
| 1180 | static float32 check_nan(float32 dst, float32 x, float_status *fp_status) |
| 1181 | { |
| 1182 | float32 ret = dst; |
| 1183 | if (float32_is_any_nan(x)) { |
| 1184 | if (extract32(x, 22, 1) == 0) { |
| 1185 | float_raise(float_flag_invalid, fp_status); |
| 1186 | } |
| 1187 | ret = make_float32(0xffffffff); /* nan */ |
| 1188 | } |
| 1189 | return ret; |
| 1190 | } |
| 1191 | |
| 1192 | float32 HELPER(sffma_sc)(CPUHexagonState *env, float32 RxV, |
| 1193 | float32 RsV, float32 RtV, float32 PuV) |
| 1194 | { |
| 1195 | size4s_t tmp; |
| 1196 | arch_fpop_start(env); |
| 1197 | RxV = check_nan(RxV, RxV, &env->fp_status); |
| 1198 | RxV = check_nan(RxV, RsV, &env->fp_status); |
| 1199 | RxV = check_nan(RxV, RtV, &env->fp_status); |
| 1200 | tmp = internal_fmafx(RsV, RtV, RxV, fSXTN(8, 64, PuV), &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1201 | if (!(float32_is_zero(RxV) && is_zero_prod(RsV, RtV))) { |
| 1202 | RxV = tmp; |
| 1203 | } |
| 1204 | arch_fpop_end(env); |
| 1205 | return RxV; |
| 1206 | } |
| 1207 | |
| 1208 | float32 HELPER(sffms)(CPUHexagonState *env, float32 RxV, |
| 1209 | float32 RsV, float32 RtV) |
| 1210 | { |
| 1211 | float32 neg_RsV; |
| 1212 | arch_fpop_start(env); |
Taylor Simpson | 1a442c0 | 2023-03-06 18:58:25 -0800 | [diff] [blame] | 1213 | neg_RsV = float32_set_sign(RsV, float32_is_neg(RsV) ? 0 : 1); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1214 | RxV = internal_fmafx(neg_RsV, RtV, RxV, 0, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1215 | arch_fpop_end(env); |
| 1216 | return RxV; |
| 1217 | } |
| 1218 | |
Taylor Simpson | 2d27ceb | 2021-04-08 20:07:31 -0500 | [diff] [blame] | 1219 | static bool is_inf_prod(int32_t a, int32_t b) |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1220 | { |
| 1221 | return (float32_is_infinity(a) && float32_is_infinity(b)) || |
| 1222 | (float32_is_infinity(a) && is_finite(b) && !float32_is_zero(b)) || |
| 1223 | (float32_is_infinity(b) && is_finite(a) && !float32_is_zero(a)); |
| 1224 | } |
| 1225 | |
| 1226 | float32 HELPER(sffma_lib)(CPUHexagonState *env, float32 RxV, |
| 1227 | float32 RsV, float32 RtV) |
| 1228 | { |
Taylor Simpson | 92cfa25 | 2021-04-08 20:07:35 -0500 | [diff] [blame] | 1229 | bool infinp; |
| 1230 | bool infminusinf; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1231 | float32 tmp; |
| 1232 | |
| 1233 | arch_fpop_start(env); |
| 1234 | set_float_rounding_mode(float_round_nearest_even, &env->fp_status); |
| 1235 | infminusinf = float32_is_infinity(RxV) && |
| 1236 | is_inf_prod(RsV, RtV) && |
| 1237 | (fGETBIT(31, RsV ^ RxV ^ RtV) != 0); |
| 1238 | infinp = float32_is_infinity(RxV) || |
| 1239 | float32_is_infinity(RtV) || |
| 1240 | float32_is_infinity(RsV); |
| 1241 | RxV = check_nan(RxV, RxV, &env->fp_status); |
| 1242 | RxV = check_nan(RxV, RsV, &env->fp_status); |
| 1243 | RxV = check_nan(RxV, RtV, &env->fp_status); |
| 1244 | tmp = internal_fmafx(RsV, RtV, RxV, 0, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1245 | if (!(float32_is_zero(RxV) && is_zero_prod(RsV, RtV))) { |
| 1246 | RxV = tmp; |
| 1247 | } |
| 1248 | set_float_exception_flags(0, &env->fp_status); |
| 1249 | if (float32_is_infinity(RxV) && !infinp) { |
| 1250 | RxV = RxV - 1; |
| 1251 | } |
| 1252 | if (infminusinf) { |
| 1253 | RxV = 0; |
| 1254 | } |
| 1255 | arch_fpop_end(env); |
| 1256 | return RxV; |
| 1257 | } |
| 1258 | |
| 1259 | float32 HELPER(sffms_lib)(CPUHexagonState *env, float32 RxV, |
| 1260 | float32 RsV, float32 RtV) |
| 1261 | { |
Taylor Simpson | 92cfa25 | 2021-04-08 20:07:35 -0500 | [diff] [blame] | 1262 | bool infinp; |
| 1263 | bool infminusinf; |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1264 | float32 tmp; |
| 1265 | |
| 1266 | arch_fpop_start(env); |
| 1267 | set_float_rounding_mode(float_round_nearest_even, &env->fp_status); |
| 1268 | infminusinf = float32_is_infinity(RxV) && |
| 1269 | is_inf_prod(RsV, RtV) && |
| 1270 | (fGETBIT(31, RsV ^ RxV ^ RtV) == 0); |
| 1271 | infinp = float32_is_infinity(RxV) || |
| 1272 | float32_is_infinity(RtV) || |
| 1273 | float32_is_infinity(RsV); |
| 1274 | RxV = check_nan(RxV, RxV, &env->fp_status); |
| 1275 | RxV = check_nan(RxV, RsV, &env->fp_status); |
| 1276 | RxV = check_nan(RxV, RtV, &env->fp_status); |
| 1277 | float32 minus_RsV = float32_sub(float32_zero, RsV, &env->fp_status); |
| 1278 | tmp = internal_fmafx(minus_RsV, RtV, RxV, 0, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1279 | if (!(float32_is_zero(RxV) && is_zero_prod(RsV, RtV))) { |
| 1280 | RxV = tmp; |
| 1281 | } |
| 1282 | set_float_exception_flags(0, &env->fp_status); |
| 1283 | if (float32_is_infinity(RxV) && !infinp) { |
| 1284 | RxV = RxV - 1; |
| 1285 | } |
| 1286 | if (infminusinf) { |
| 1287 | RxV = 0; |
| 1288 | } |
| 1289 | arch_fpop_end(env); |
| 1290 | return RxV; |
| 1291 | } |
| 1292 | |
| 1293 | float64 HELPER(dfmpyfix)(CPUHexagonState *env, float64 RssV, float64 RttV) |
| 1294 | { |
| 1295 | int64_t RddV; |
| 1296 | arch_fpop_start(env); |
| 1297 | if (float64_is_denormal(RssV) && |
| 1298 | (float64_getexp(RttV) >= 512) && |
| 1299 | float64_is_normal(RttV)) { |
| 1300 | RddV = float64_mul(RssV, make_float64(0x4330000000000000), |
| 1301 | &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1302 | } else if (float64_is_denormal(RttV) && |
| 1303 | (float64_getexp(RssV) >= 512) && |
| 1304 | float64_is_normal(RssV)) { |
| 1305 | RddV = float64_mul(RssV, make_float64(0x3cb0000000000000), |
| 1306 | &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1307 | } else { |
| 1308 | RddV = RssV; |
| 1309 | } |
| 1310 | arch_fpop_end(env); |
| 1311 | return RddV; |
| 1312 | } |
| 1313 | |
| 1314 | float64 HELPER(dfmpyhh)(CPUHexagonState *env, float64 RxxV, |
| 1315 | float64 RssV, float64 RttV) |
| 1316 | { |
| 1317 | arch_fpop_start(env); |
| 1318 | RxxV = internal_mpyhh(RssV, RttV, RxxV, &env->fp_status); |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1319 | arch_fpop_end(env); |
| 1320 | return RxxV; |
| 1321 | } |
| 1322 | |
Taylor Simpson | 33e9ed1 | 2021-09-30 11:07:00 -0500 | [diff] [blame] | 1323 | /* Histogram instructions */ |
| 1324 | |
| 1325 | void HELPER(vhist)(CPUHexagonState *env) |
| 1326 | { |
| 1327 | MMVector *input = &env->tmp_VRegs[0]; |
| 1328 | |
| 1329 | for (int lane = 0; lane < 8; lane++) { |
| 1330 | for (int i = 0; i < sizeof(MMVector) / 8; ++i) { |
| 1331 | unsigned char value = input->ub[(sizeof(MMVector) / 8) * lane + i]; |
| 1332 | unsigned char regno = value >> 3; |
| 1333 | unsigned char element = value & 7; |
| 1334 | |
| 1335 | env->VRegs[regno].uh[(sizeof(MMVector) / 16) * lane + element]++; |
| 1336 | } |
| 1337 | } |
| 1338 | } |
| 1339 | |
| 1340 | void HELPER(vhistq)(CPUHexagonState *env) |
| 1341 | { |
| 1342 | MMVector *input = &env->tmp_VRegs[0]; |
| 1343 | |
| 1344 | for (int lane = 0; lane < 8; lane++) { |
| 1345 | for (int i = 0; i < sizeof(MMVector) / 8; ++i) { |
| 1346 | unsigned char value = input->ub[(sizeof(MMVector) / 8) * lane + i]; |
| 1347 | unsigned char regno = value >> 3; |
| 1348 | unsigned char element = value & 7; |
| 1349 | |
| 1350 | if (fGETQBIT(env->qtmp, sizeof(MMVector) / 8 * lane + i)) { |
| 1351 | env->VRegs[regno].uh[ |
| 1352 | (sizeof(MMVector) / 16) * lane + element]++; |
| 1353 | } |
| 1354 | } |
| 1355 | } |
| 1356 | } |
| 1357 | |
| 1358 | void HELPER(vwhist256)(CPUHexagonState *env) |
| 1359 | { |
| 1360 | MMVector *input = &env->tmp_VRegs[0]; |
| 1361 | |
| 1362 | for (int i = 0; i < (sizeof(MMVector) / 2); i++) { |
| 1363 | unsigned int bucket = fGETUBYTE(0, input->h[i]); |
| 1364 | unsigned int weight = fGETUBYTE(1, input->h[i]); |
| 1365 | unsigned int vindex = (bucket >> 3) & 0x1F; |
| 1366 | unsigned int elindex = ((i >> 0) & (~7)) | ((bucket >> 0) & 7); |
| 1367 | |
| 1368 | env->VRegs[vindex].uh[elindex] = |
| 1369 | env->VRegs[vindex].uh[elindex] + weight; |
| 1370 | } |
| 1371 | } |
| 1372 | |
| 1373 | void HELPER(vwhist256q)(CPUHexagonState *env) |
| 1374 | { |
| 1375 | MMVector *input = &env->tmp_VRegs[0]; |
| 1376 | |
| 1377 | for (int i = 0; i < (sizeof(MMVector) / 2); i++) { |
| 1378 | unsigned int bucket = fGETUBYTE(0, input->h[i]); |
| 1379 | unsigned int weight = fGETUBYTE(1, input->h[i]); |
| 1380 | unsigned int vindex = (bucket >> 3) & 0x1F; |
| 1381 | unsigned int elindex = ((i >> 0) & (~7)) | ((bucket >> 0) & 7); |
| 1382 | |
| 1383 | if (fGETQBIT(env->qtmp, 2 * i)) { |
| 1384 | env->VRegs[vindex].uh[elindex] = |
| 1385 | env->VRegs[vindex].uh[elindex] + weight; |
| 1386 | } |
| 1387 | } |
| 1388 | } |
| 1389 | |
| 1390 | void HELPER(vwhist256_sat)(CPUHexagonState *env) |
| 1391 | { |
| 1392 | MMVector *input = &env->tmp_VRegs[0]; |
| 1393 | |
| 1394 | for (int i = 0; i < (sizeof(MMVector) / 2); i++) { |
| 1395 | unsigned int bucket = fGETUBYTE(0, input->h[i]); |
| 1396 | unsigned int weight = fGETUBYTE(1, input->h[i]); |
| 1397 | unsigned int vindex = (bucket >> 3) & 0x1F; |
| 1398 | unsigned int elindex = ((i >> 0) & (~7)) | ((bucket >> 0) & 7); |
| 1399 | |
| 1400 | env->VRegs[vindex].uh[elindex] = |
| 1401 | fVSATUH(env->VRegs[vindex].uh[elindex] + weight); |
| 1402 | } |
| 1403 | } |
| 1404 | |
| 1405 | void HELPER(vwhist256q_sat)(CPUHexagonState *env) |
| 1406 | { |
| 1407 | MMVector *input = &env->tmp_VRegs[0]; |
| 1408 | |
| 1409 | for (int i = 0; i < (sizeof(MMVector) / 2); i++) { |
| 1410 | unsigned int bucket = fGETUBYTE(0, input->h[i]); |
| 1411 | unsigned int weight = fGETUBYTE(1, input->h[i]); |
| 1412 | unsigned int vindex = (bucket >> 3) & 0x1F; |
| 1413 | unsigned int elindex = ((i >> 0) & (~7)) | ((bucket >> 0) & 7); |
| 1414 | |
| 1415 | if (fGETQBIT(env->qtmp, 2 * i)) { |
| 1416 | env->VRegs[vindex].uh[elindex] = |
| 1417 | fVSATUH(env->VRegs[vindex].uh[elindex] + weight); |
| 1418 | } |
| 1419 | } |
| 1420 | } |
| 1421 | |
| 1422 | void HELPER(vwhist128)(CPUHexagonState *env) |
| 1423 | { |
| 1424 | MMVector *input = &env->tmp_VRegs[0]; |
| 1425 | |
| 1426 | for (int i = 0; i < (sizeof(MMVector) / 2); i++) { |
| 1427 | unsigned int bucket = fGETUBYTE(0, input->h[i]); |
| 1428 | unsigned int weight = fGETUBYTE(1, input->h[i]); |
| 1429 | unsigned int vindex = (bucket >> 3) & 0x1F; |
| 1430 | unsigned int elindex = ((i >> 1) & (~3)) | ((bucket >> 1) & 3); |
| 1431 | |
| 1432 | env->VRegs[vindex].uw[elindex] = |
| 1433 | env->VRegs[vindex].uw[elindex] + weight; |
| 1434 | } |
| 1435 | } |
| 1436 | |
| 1437 | void HELPER(vwhist128q)(CPUHexagonState *env) |
| 1438 | { |
| 1439 | MMVector *input = &env->tmp_VRegs[0]; |
| 1440 | |
| 1441 | for (int i = 0; i < (sizeof(MMVector) / 2); i++) { |
| 1442 | unsigned int bucket = fGETUBYTE(0, input->h[i]); |
| 1443 | unsigned int weight = fGETUBYTE(1, input->h[i]); |
| 1444 | unsigned int vindex = (bucket >> 3) & 0x1F; |
| 1445 | unsigned int elindex = ((i >> 1) & (~3)) | ((bucket >> 1) & 3); |
| 1446 | |
| 1447 | if (fGETQBIT(env->qtmp, 2 * i)) { |
| 1448 | env->VRegs[vindex].uw[elindex] = |
| 1449 | env->VRegs[vindex].uw[elindex] + weight; |
| 1450 | } |
| 1451 | } |
| 1452 | } |
| 1453 | |
| 1454 | void HELPER(vwhist128m)(CPUHexagonState *env, int32_t uiV) |
| 1455 | { |
| 1456 | MMVector *input = &env->tmp_VRegs[0]; |
| 1457 | |
| 1458 | for (int i = 0; i < (sizeof(MMVector) / 2); i++) { |
| 1459 | unsigned int bucket = fGETUBYTE(0, input->h[i]); |
| 1460 | unsigned int weight = fGETUBYTE(1, input->h[i]); |
| 1461 | unsigned int vindex = (bucket >> 3) & 0x1F; |
| 1462 | unsigned int elindex = ((i >> 1) & (~3)) | ((bucket >> 1) & 3); |
| 1463 | |
| 1464 | if ((bucket & 1) == uiV) { |
| 1465 | env->VRegs[vindex].uw[elindex] = |
| 1466 | env->VRegs[vindex].uw[elindex] + weight; |
| 1467 | } |
| 1468 | } |
| 1469 | } |
| 1470 | |
| 1471 | void HELPER(vwhist128qm)(CPUHexagonState *env, int32_t uiV) |
| 1472 | { |
| 1473 | MMVector *input = &env->tmp_VRegs[0]; |
| 1474 | |
| 1475 | for (int i = 0; i < (sizeof(MMVector) / 2); i++) { |
| 1476 | unsigned int bucket = fGETUBYTE(0, input->h[i]); |
| 1477 | unsigned int weight = fGETUBYTE(1, input->h[i]); |
| 1478 | unsigned int vindex = (bucket >> 3) & 0x1F; |
| 1479 | unsigned int elindex = ((i >> 1) & (~3)) | ((bucket >> 1) & 3); |
| 1480 | |
| 1481 | if (((bucket & 1) == uiV) && fGETQBIT(env->qtmp, 2 * i)) { |
| 1482 | env->VRegs[vindex].uw[elindex] = |
| 1483 | env->VRegs[vindex].uw[elindex] + weight; |
| 1484 | } |
| 1485 | } |
| 1486 | } |
| 1487 | |
Taylor Simpson | b5ed786 | 2021-02-07 23:45:57 -0600 | [diff] [blame] | 1488 | /* These macros can be referenced in the generated helper functions */ |
| 1489 | #define warn(...) /* Nothing */ |
| 1490 | #define fatal(...) g_assert_not_reached(); |
| 1491 | |
| 1492 | #define BOGUS_HELPER(tag) \ |
| 1493 | printf("ERROR: bogus helper: " #tag "\n") |
| 1494 | |
| 1495 | #include "helper_funcs_generated.c.inc" |