Taylor Simpson | 1547a2d | 2024-01-15 15:14:41 -0700 | [diff] [blame] | 1 | #!/usr/bin/env python3 |
| 2 | |
| 3 | ## |
| 4 | ## Copyright (c) 2024 Taylor Simpson <ltaylorsimpson@gmail.com> |
| 5 | ## |
| 6 | ## This program is free software; you can redistribute it and/or modify |
| 7 | ## it under the terms of the GNU General Public License as published by |
| 8 | ## the Free Software Foundation; either version 2 of the License, or |
| 9 | ## (at your option) any later version. |
| 10 | ## |
| 11 | ## This program is distributed in the hope that it will be useful, |
| 12 | ## but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 13 | ## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| 14 | ## GNU General Public License for more details. |
| 15 | ## |
| 16 | ## You should have received a copy of the GNU General Public License |
| 17 | ## along with this program; if not, see <http://www.gnu.org/licenses/>. |
| 18 | ## |
| 19 | |
| 20 | import io |
| 21 | import re |
| 22 | |
| 23 | import sys |
| 24 | import textwrap |
| 25 | import iset |
| 26 | import hex_common |
| 27 | |
| 28 | encs = { |
| 29 | tag: "".join(reversed(iset.iset[tag]["enc"].replace(" ", ""))) |
| 30 | for tag in iset.tags |
| 31 | if iset.iset[tag]["enc"] != "MISSING ENCODING" |
| 32 | } |
| 33 | |
| 34 | |
| 35 | regre = re.compile(r"((?<!DUP)[MNORCPQXSGVZA])([stuvwxyzdefg]+)([.]?[LlHh]?)(\d+S?)") |
| 36 | immre = re.compile(r"[#]([rRsSuUm])(\d+)(?:[:](\d+))?") |
| 37 | |
| 38 | |
| 39 | def ordered_unique(l): |
| 40 | return sorted(set(l), key=l.index) |
| 41 | |
| 42 | num_registers = {"R": 32, "V": 32} |
| 43 | |
| 44 | operand_letters = { |
| 45 | "P", |
| 46 | "i", |
| 47 | "I", |
| 48 | "r", |
| 49 | "s", |
| 50 | "t", |
| 51 | "u", |
| 52 | "v", |
| 53 | "w", |
| 54 | "x", |
| 55 | "y", |
| 56 | "z", |
| 57 | "d", |
| 58 | "e", |
| 59 | "f", |
| 60 | "g", |
| 61 | } |
| 62 | |
| 63 | # |
| 64 | # These instructions have unused operand letters in their encoding |
| 65 | # They don't correspond to actual operands in the instruction semantics |
| 66 | # We will mark them as ignored in QEMU decodetree |
| 67 | # |
| 68 | tags_with_unused_d_encoding = { |
| 69 | "R6_release_at_vi", |
| 70 | "R6_release_st_vi", |
| 71 | "S4_stored_rl_at_vi", |
| 72 | "S4_stored_rl_st_vi", |
| 73 | "S2_storew_rl_at_vi", |
| 74 | "S2_stored_rl_at_vi", |
| 75 | "S2_storew_rl_st_vi", |
| 76 | } |
| 77 | |
| 78 | tags_with_unused_t_encoding = { |
| 79 | "R6_release_at_vi", |
| 80 | "R6_release_st_vi", |
| 81 | } |
| 82 | |
| 83 | def skip_tag(tag, class_to_decode): |
| 84 | enc_class = iset.iset[tag]["enc_class"] |
| 85 | return enc_class != class_to_decode |
| 86 | |
| 87 | |
| 88 | ## |
| 89 | ## Generate the QEMU decodetree file for each instruction in class_to_decode |
| 90 | ## For A2_add: Rd32=add(Rs32,Rt32) |
| 91 | ## We produce: |
| 92 | ## %A2_add_Rd 0:5 |
| 93 | ## %A2_add_Rs 16:5 |
| 94 | ## %A2_add_Rt 8:5 |
| 95 | ## @A2_add 11110011000.......-.....---..... Rd=%A2_add_Rd Rs=%A2_add_Rs Rt=%A2_add_Rt %PP |
| 96 | ## A2_add ..................-.....---..... @A2_add |
| 97 | ## |
| 98 | def gen_decodetree_file(f, class_to_decode): |
Taylor Simpson | f6c0100 | 2024-01-15 15:14:42 -0700 | [diff] [blame] | 99 | is_subinsn = class_to_decode.startswith("SUBINSN_") |
Taylor Simpson | 1547a2d | 2024-01-15 15:14:41 -0700 | [diff] [blame] | 100 | f.write(f"## DO NOT MODIFY - This file is generated by {sys.argv[0]}\n\n") |
Taylor Simpson | f6c0100 | 2024-01-15 15:14:42 -0700 | [diff] [blame] | 101 | if not is_subinsn: |
| 102 | f.write("%PP\t14:2\n\n") |
Taylor Simpson | 1547a2d | 2024-01-15 15:14:41 -0700 | [diff] [blame] | 103 | for tag in sorted(encs.keys(), key=iset.tags.index): |
| 104 | if skip_tag(tag, class_to_decode): |
| 105 | continue |
| 106 | |
| 107 | enc = encs[tag] |
| 108 | enc_str = "".join(reversed(encs[tag])) |
| 109 | f.write(("#" * 80) + "\n" |
| 110 | f"## {tag}:\t{enc_str}\n" |
| 111 | "##\n") |
| 112 | |
Taylor Simpson | f6c0100 | 2024-01-15 15:14:42 -0700 | [diff] [blame] | 113 | # The subinstructions come with a 13-bit encoding, but |
| 114 | # decodetree.py needs 16 bits |
| 115 | if is_subinsn: |
| 116 | enc_str = "---" + enc_str |
Taylor Simpson | 1547a2d | 2024-01-15 15:14:41 -0700 | [diff] [blame] | 117 | |
| 118 | regs = ordered_unique(regre.findall(iset.iset[tag]["syntax"])) |
| 119 | imms = ordered_unique(immre.findall(iset.iset[tag]["syntax"])) |
| 120 | |
| 121 | # Write the field definitions for the registers |
| 122 | for regno, reg in enumerate(regs): |
| 123 | reg_type, reg_id, _, reg_enc_size = reg |
| 124 | reg_letter = reg_id[0] |
| 125 | reg_num_choices = int(reg_enc_size.rstrip("S")) |
| 126 | reg_mapping = reg_type + "".join("_" for letter in reg_id) + \ |
| 127 | reg_enc_size |
| 128 | reg_enc_fields = re.findall(reg_letter + "+", enc) |
| 129 | |
| 130 | # Check for some errors |
| 131 | if len(reg_enc_fields) == 0: |
| 132 | raise Exception(f"{tag} missing register field!") |
| 133 | if len(reg_enc_fields) > 1: |
| 134 | raise Exception(f"{tag} has split register field!") |
| 135 | reg_enc_field = reg_enc_fields[0] |
| 136 | if 2 ** len(reg_enc_field) != reg_num_choices: |
| 137 | raise Exception(f"{tag} has incorrect register field width!") |
| 138 | |
| 139 | f.write(f"%{tag}_{reg_type}{reg_id}\t" |
| 140 | f"{enc.index(reg_enc_field)}:{len(reg_enc_field)}") |
| 141 | |
| 142 | if (reg_type in num_registers and |
| 143 | reg_num_choices != num_registers[reg_type]): |
| 144 | f.write(f"\t!function=decode_mapped_reg_{reg_mapping}") |
| 145 | f.write("\n") |
| 146 | |
| 147 | # Write the field definitions for the immediates |
| 148 | for imm in imms: |
| 149 | immno = 1 if imm[0].isupper() else 0 |
| 150 | imm_type = imm[0] |
| 151 | imm_width = int(imm[1]) |
| 152 | imm_letter = "i" if imm_type.islower() else "I" |
| 153 | fields = [] |
| 154 | sign_mark = "s" if imm_type.lower() in "sr" else "" |
| 155 | for m in reversed(list(re.finditer(imm_letter + "+", enc))): |
| 156 | fields.append(f"{m.start()}:{sign_mark}{m.end() - m.start()}") |
| 157 | sign_mark = "" |
| 158 | field_str = " ".join(fields) |
| 159 | f.write(f"%{tag}_{imm_type}{imm_letter}\t{field_str}\n") |
| 160 | |
| 161 | ## Handle instructions with unused encoding letters |
| 162 | ## Change the unused letters to ignored |
| 163 | if tag in tags_with_unused_d_encoding: |
| 164 | enc_str = enc_str.replace("d", "-") |
| 165 | if tag in tags_with_unused_t_encoding: |
| 166 | enc_str = enc_str.replace("t", "-") |
| 167 | |
| 168 | # Replace the operand letters with . |
| 169 | for x in operand_letters: |
| 170 | enc_str = enc_str.replace(x, ".") |
| 171 | |
| 172 | # Write the instruction format |
| 173 | f.write(f"@{tag}\t{enc_str}") |
| 174 | for reg in regs: |
| 175 | reg_type = reg[0] |
| 176 | reg_id = reg[1] |
| 177 | f.write(f" {reg_type}{reg_id}=%{tag}_{reg_type}{reg_id}") |
| 178 | for imm in imms: |
| 179 | imm_type = imm[0] |
| 180 | imm_letter = "i" if imm_type.islower() else "I" |
| 181 | f.write(f" {imm_type}{imm_letter}=%{tag}_{imm_type}{imm_letter}") |
| 182 | |
Taylor Simpson | f6c0100 | 2024-01-15 15:14:42 -0700 | [diff] [blame] | 183 | if not is_subinsn: |
| 184 | f.write(" %PP") |
| 185 | f.write("\n") |
Taylor Simpson | 1547a2d | 2024-01-15 15:14:41 -0700 | [diff] [blame] | 186 | |
| 187 | # Replace the 0s and 1s with . |
| 188 | enc_str = enc_str.replace("0", ".").replace("1", ".") |
| 189 | |
| 190 | # Write the instruction pattern |
| 191 | f.write(f"{tag}\t{enc_str} @{tag}\n") |
| 192 | |
| 193 | |
| 194 | if __name__ == "__main__": |
| 195 | hex_common.read_semantics_file(sys.argv[1]) |
| 196 | class_to_decode = sys.argv[2] |
| 197 | with open(sys.argv[3], "w") as f: |
| 198 | gen_decodetree_file(f, class_to_decode) |