target/hexagon/gen_decodetree.py

1547a2d3STaylor Simpson#!/usr/bin/env python3
1547a2d3STaylor Simpson
1547a2d3STaylor Simpson##
1547a2d3STaylor Simpson##  Copyright (c) 2024 Taylor Simpson <ltaylorsimpson@gmail.com>
1547a2d3STaylor Simpson##
1547a2d3STaylor Simpson##  This program is free software; you can redistribute it and/or modify
1547a2d3STaylor Simpson##  it under the terms of the GNU General Public License as published by
1547a2d3STaylor Simpson##  the Free Software Foundation; either version 2 of the License, or
1547a2d3STaylor Simpson##  (at your option) any later version.
1547a2d3STaylor Simpson##
1547a2d3STaylor Simpson##  This program is distributed in the hope that it will be useful,
1547a2d3STaylor Simpson##  but WITHOUT ANY WARRANTY; without even the implied warranty of
1547a2d3STaylor Simpson##  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
1547a2d3STaylor Simpson##  GNU General Public License for more details.
1547a2d3STaylor Simpson##
1547a2d3STaylor Simpson##  You should have received a copy of the GNU General Public License
1547a2d3STaylor Simpson##  along with this program; if not, see <http://www.gnu.org/licenses/>.
1547a2d3STaylor Simpson##
1547a2d3STaylor Simpson
1547a2d3STaylor Simpsonimport io
1547a2d3STaylor Simpsonimport re
1547a2d3STaylor Simpson
1547a2d3STaylor Simpsonimport sys
1547a2d3STaylor Simpsonimport textwrap
1547a2d3STaylor Simpsonimport iset
1547a2d3STaylor Simpsonimport hex_common
1547a2d3STaylor Simpson
# Encoding string for every tag that has one, with the spaces removed and
# the characters reversed.  gen_decodetree_file uses a character's index in
# this reversed string directly as the field position it writes out.
encs = {
    tag: iset.iset[tag]["enc"].replace(" ", "")[::-1]
    for tag in iset.tags
    if iset.iset[tag]["enc"] != "MISSING ENCODING"
}


# Register operand in an instruction syntax string.  Groups:
#   1: register type letter (skipped when directly preceded by "DUP")
#   2: one or more operand id letters
#   3: optional "." and/or one of L, l, H, h
#   4: size digits, optionally followed by "S"
regre = re.compile(r"((?<!DUP)[MNORCPQXSGVZA])([stuvwxyzdefg]+)([.]?[LlHh]?)(\d+S?)")
# Immediate operand in an instruction syntax string.  Groups:
#   1: immediate type letter
#   2: digits following the type letter
#   3: optional digits following a ":"
immre = re.compile(r"[#]([rRsSuUm])(\d+)(?:[:](\d+))?")
1547a2d3STaylor Simpson
1547a2d3STaylor Simpson
def ordered_unique(l):
    """Return the distinct items of *l* as a list, in first-seen order.

    dict keys keep insertion order, so building a dict from the items
    removes duplicates in a single pass instead of calling ``l.index`` once
    per distinct item.  Items must be hashable.
    """
    return list(dict.fromkeys(l))
1547a2d3STaylor Simpson
# Number of registers for the register types listed here.  A register field
# of one of these types that offers a different number of choices is given a
# decode_mapped_reg_* function by gen_decodetree_file.
num_registers = dict(R=32, V=32)

# Letters in an encoding string that gen_decodetree_file replaces with "."
operand_letters = set("PiIrstuvwxyzdefg")

#
# The encodings of the instructions below contain operand letters that are
# not used: they don't correspond to actual operands in the instruction
# semantics.  We will mark them as ignored in QEMU decodetree.
#
tags_with_unused_t_encoding = {
    "R6_release_at_vi",
    "R6_release_st_vi",
}

# Every tag with an unused "t" also has an unused "d"
tags_with_unused_d_encoding = tags_with_unused_t_encoding | {
    "S4_stored_rl_at_vi",
    "S4_stored_rl_st_vi",
    "S2_storew_rl_at_vi",
    "S2_stored_rl_at_vi",
    "S2_storew_rl_st_vi",
}
1547a2d3STaylor Simpson
def skip_tag(tag, class_to_decode):
    """Return True when *tag*'s enc_class differs from *class_to_decode*."""
    return iset.iset[tag]["enc_class"] != class_to_decode
1547a2d3STaylor Simpson
1547a2d3STaylor Simpson
##
## Generate the QEMU decodetree file for each instruction in class_to_decode
##     For A2_add: Rd32=add(Rs32,Rt32)
##     We produce:
##     %A2_add_Rd   0:5
##     %A2_add_Rs   16:5
##     %A2_add_Rt   8:5
##     @A2_add  11110011000.......-.....---..... Rd=%A2_add_Rd Rs=%A2_add_Rs Rt=%A2_add_Rt %PP
##     A2_add   ..................-.....---..... @A2_add
##
## f is the writable text stream that receives the output.
## class_to_decode is compared against each tag's enc_class; when it starts
## with "SUBINSN_" no %PP field is emitted and every encoding is prefixed
## with "---".
##
## Raises Exception when the encoding field of a register operand is
## missing, split, or of a width that doesn't match the operand's size.
##
def gen_decodetree_file(f, class_to_decode):
    is_subinsn = class_to_decode.startswith("SUBINSN_")
    # Built once: maps every operand letter to "." in a single pass
    operand_to_dot = str.maketrans(dict.fromkeys(operand_letters, "."))

    f.write(f"## DO NOT MODIFY - This file is generated by {sys.argv[0]}\n\n")
    if not is_subinsn:
        f.write("%PP\t14:2\n\n")

    for tag in sorted(encs.keys(), key=iset.tags.index):
        if skip_tag(tag, class_to_decode):
            continue

        # enc is the reversed encoding, so a string index can be written
        # out as a field position; enc_str is back in the original order
        enc = encs[tag]
        enc_str = enc[::-1]
        f.write("#" * 80 + "\n" + f"## {tag}:\t{enc_str}\n" + "##\n")

        # The subinstructions come with a 13-bit encoding, but
        # decodetree.py needs 16 bits
        if is_subinsn:
            enc_str = "---" + enc_str

        syntax = iset.iset[tag]["syntax"]
        regs = ordered_unique(regre.findall(syntax))
        imms = ordered_unique(immre.findall(syntax))

        # Write the field definitions for the registers
        for reg_type, reg_id, _, reg_enc_size in regs:
            reg_letter = reg_id[0]
            reg_num_choices = int(reg_enc_size.rstrip("S"))
            # One "_" per id letter, e.g. type + "_" + size
            reg_mapping = reg_type + "_" * len(reg_id) + reg_enc_size
            reg_enc_fields = re.findall(reg_letter + "+", enc)

            # Check for some errors
            if not reg_enc_fields:
                raise Exception(f"{tag} missing register field!")
            if len(reg_enc_fields) > 1:
                raise Exception(f"{tag} has split register field!")
            reg_enc_field = reg_enc_fields[0]
            if 2 ** len(reg_enc_field) != reg_num_choices:
                raise Exception(f"{tag} has incorrect register field width!")

            field_def = (f"%{tag}_{reg_type}{reg_id}\t"
                         f"{enc.index(reg_enc_field)}:{len(reg_enc_field)}")
            # Register types listed in num_registers get a mapping function
            # when the field offers a different number of choices
            if (reg_type in num_registers and
                    reg_num_choices != num_registers[reg_type]):
                field_def += f"\t!function=decode_mapped_reg_{reg_mapping}"
            f.write(field_def + "\n")

        # Write the field definitions for the immediates
        for imm in imms:
            imm_type = imm[0]
            imm_letter = "i" if imm_type.islower() else "I"
            sign_mark = "s" if imm_type.lower() in "sr" else ""
            fields = []
            # Walk the runs of the immediate's letter from the highest
            # position down; only the first one written gets the sign mark
            for m in reversed(list(re.finditer(imm_letter + "+", enc))):
                fields.append(f"{m.start()}:{sign_mark}{m.end() - m.start()}")
                sign_mark = ""
            field_str = " ".join(fields)
            f.write(f"%{tag}_{imm_type}{imm_letter}\t{field_str}\n")

        ## Handle instructions with unused encoding letters
        ## Change the unused letters to ignored
        if tag in tags_with_unused_d_encoding:
            enc_str = enc_str.replace("d", "-")
        if tag in tags_with_unused_t_encoding:
            enc_str = enc_str.replace("t", "-")

        # Replace the operand letters with .
        enc_str = enc_str.translate(operand_to_dot)

        # Write the instruction format
        format_parts = [f"@{tag}\t{enc_str}"]
        for reg_type, reg_id, _, _ in regs:
            format_parts.append(f" {reg_type}{reg_id}=%{tag}_{reg_type}{reg_id}")
        for imm in imms:
            imm_type = imm[0]
            imm_letter = "i" if imm_type.islower() else "I"
            format_parts.append(
                f" {imm_type}{imm_letter}=%{tag}_{imm_type}{imm_letter}"
            )
        if not is_subinsn:
            format_parts.append(" %PP")
        format_parts.append("\n")
        f.write("".join(format_parts))

        # Replace the 0s and 1s with .
        enc_str = enc_str.replace("0", ".").replace("1", ".")

        # Write the instruction pattern
        f.write(f"{tag}\t{enc_str} @{tag}\n")
1547a2d3STaylor Simpson
1547a2d3STaylor Simpson
if __name__ == "__main__":
    # argv[1]: file handed to hex_common.read_semantics_file
    # argv[2]: class to decode
    # argv[3]: path of the file to generate
    semantics_path = sys.argv[1]
    hex_common.read_semantics_file(semantics_path)
    class_to_decode = sys.argv[2]
    output_path = sys.argv[3]
    with open(output_path, "w") as f:
        gen_decodetree_file(f, class_to_decode)