From 1b0ef5d896a1652dc52a5353521d9990d481c76b Mon Sep 17 00:00:00 2001
From: IIITM-Jay <jaydev.neuroscitech@gmail.com>
Date: Tue, 17 Sep 2024 00:53:00 +0530
Subject: [PATCH] Refactored and Optimized Logic:: Parser Logic, Latex Based
 Output & Shared Modules

---
 c_utils.py        |   71 +++
 chisel_utils.py   |   88 ++++
 go_utils.py       |   65 +++
 latex_utils.py    |  435 +++++++++++++++++
 parse.py          | 1182 ++++-----------------------------------------
 rust_utils.py     |   31 ++
 shared_utils.py   |  547 +++++++++++++++++++++
 sverilog_utils.py |   30 ++
 8 files changed, 1368 insertions(+), 1081 deletions(-)
 create mode 100644 c_utils.py
 create mode 100644 chisel_utils.py
 create mode 100644 go_utils.py
 create mode 100644 latex_utils.py
 create mode 100644 rust_utils.py
 create mode 100644 shared_utils.py
 create mode 100644 sverilog_utils.py

diff --git a/c_utils.py b/c_utils.py
new file mode 100644
index 00000000..4143625f
--- /dev/null
+++ b/c_utils.py
@@ -0,0 +1,71 @@
+import re
+import glob
+import os
+import pprint
+import logging
+import collections
+import yaml
+import sys
+# from shared_utils import overlaps, overlap_allowed, extension_overlap_allowed, instruction_overlap_allowed, process_enc_line, same_base_isa, add_segmented_vls_insn, expand_nf_field
+from shared_utils import *
+
+pp = pprint.PrettyPrinter(indent=2)
+logging.basicConfig(level=logging.INFO, format='%(levelname)s:: %(message)s')
+
+def make_c(instr_dict):
+    mask_match_str = ''
+    declare_insn_str = ''
+    for i in instr_dict:
+        mask_match_str += f'#define MATCH_{i.upper().replace(".","_")} {instr_dict[i]["match"]}\n'
+        mask_match_str += f'#define MASK_{i.upper().replace(".","_")} {instr_dict[i]["mask"]}\n'
+        declare_insn_str += f'DECLARE_INSN({i.replace(".","_")}, MATCH_{i.upper().replace(".","_")}, MASK_{i.upper().replace(".","_")})\n'
+
+    csr_names_str = ''
+    declare_csr_str = ''
+    for num, name in csrs+csrs32:
+        csr_names_str += f'#define CSR_{name.upper()} {hex(num)}\n'
+        declare_csr_str += f'DECLARE_CSR({name}, CSR_{name.upper()})\n'
+
+    causes_str= ''
+    declare_cause_str = ''
+    for num, name in causes:
+        causes_str += f"#define CAUSE_{name.upper().replace(' ', '_')} {hex(num)}\n"
+        declare_cause_str += f"DECLARE_CAUSE(\"{name}\", CAUSE_{name.upper().replace(' ','_')})\n"
+
+    arg_str = ''
+    for name, rng in arg_lut.items():
+        begin = rng[1]
+        end   = rng[0]
+        mask = ((1 << (end - begin + 1)) - 1) << begin
+        arg_str += f"#define INSN_FIELD_{name.upper().replace(' ', '_')} {hex(mask)}\n"
+
+    with open(f'{os.path.dirname(__file__)}/encoding.h', 'r') as file:
+        enc_header = file.read()
+
+    commit = os.popen('git log -1 --format="format:%h"').read()
+    enc_file = open('encoding.out.h','w')
+    enc_file.write(f'''/* SPDX-License-Identifier: BSD-3-Clause */
+
+/* Copyright (c) 2023 RISC-V International */
+
+/*
+ * This file is auto-generated by running 'make' in
+ * https://github.com/riscv/riscv-opcodes ({commit})
+ */
+
+{enc_header}
+/* Automatically generated by parse_opcodes. */
+#ifndef RISCV_ENCODING_H
+#define RISCV_ENCODING_H
+{mask_match_str}
+{csr_names_str}
+{causes_str}
+{arg_str}#endif
+#ifdef DECLARE_INSN
+{declare_insn_str}#endif
+#ifdef DECLARE_CSR
+{declare_csr_str}#endif
+#ifdef DECLARE_CAUSE
+{declare_cause_str}#endif
+''')
+    enc_file.close()
diff --git a/chisel_utils.py b/chisel_utils.py
new file mode 100644
index 00000000..061eef4b
--- /dev/null
+++ b/chisel_utils.py
@@ -0,0 +1,88 @@
+from constants import *
+import copy
+import re
+import glob
+import os
+import pprint
+import logging
+import collections
+import yaml
+import sys
+# from shared_utils import overlaps, overlap_allowed, extension_overlap_allowed, instruction_overlap_allowed, process_enc_line, same_base_isa, add_segmented_vls_insn, expand_nf_field
+from shared_utils import *
+
+pp = pprint.PrettyPrinter(indent=2)
+logging.basicConfig(level=logging.INFO, format='%(levelname)s:: %(message)s')
+
+def make_chisel(instr_dict, spinal_hdl=False):
+
+    chisel_names=''
+    cause_names_str=''
+    csr_names_str = ''
+    for i in instr_dict:
+        if spinal_hdl:
+            chisel_names += f'  def {i.upper().replace(".","_"):<18s} = M"b{instr_dict[i]["encoding"].replace("-","-")}"\n'
+        # else:
+        #     chisel_names += f'  def {i.upper().replace(".","_"):<18s} = BitPat("b{instr_dict[i]["encoding"].replace("-","?")}")\n'
+    if not spinal_hdl:
+        extensions = instr_dict_2_extensions(instr_dict)
+        for e in extensions:
+            e_instrs = filter(lambda i: instr_dict[i]['extension'][0] == e, instr_dict)
+            if "rv64_" in e:
+                e_format = e.replace("rv64_", "").upper() + "64"
+            elif "rv32_" in e:
+                e_format = e.replace("rv32_", "").upper() + "32"
+            elif "rv_" in e:
+                e_format = e.replace("rv_", "").upper()
+            else:
+                e_format = e.upper
+            chisel_names += f'  val {e_format+"Type"} = Map(\n'
+            for instr in e_instrs:
+                tmp_instr_name = '"'+instr.upper().replace(".","_")+'"'
+                chisel_names += f'   {tmp_instr_name:<18s} -> BitPat("b{instr_dict[instr]["encoding"].replace("-","?")}"),\n'
+            chisel_names += f'  )\n'
+
+    for num, name in causes:
+        cause_names_str += f'  val {name.lower().replace(" ","_")} = {hex(num)}\n'
+    cause_names_str += '''  val all = {
+    val res = collection.mutable.ArrayBuffer[Int]()
+'''
+    for num, name in causes:
+        cause_names_str += f'    res += {name.lower().replace(" ","_")}\n'
+    cause_names_str += '''    res.toArray
+  }'''
+
+    for num, name in csrs+csrs32:
+        csr_names_str += f'  val {name} = {hex(num)}\n'
+    csr_names_str += '''  val all = {
+    val res = collection.mutable.ArrayBuffer[Int]()
+'''
+    for num, name in csrs:
+        csr_names_str += f'''    res += {name}\n'''
+    csr_names_str += '''    res.toArray
+  }
+  val all32 = {
+    val res = collection.mutable.ArrayBuffer(all:_*)
+'''
+    for num, name in csrs32:
+        csr_names_str += f'''    res += {name}\n'''
+    csr_names_str += '''    res.toArray
+  }'''
+
+    if spinal_hdl:
+        chisel_file = open('inst.spinalhdl','w')
+    else:
+        chisel_file = open('inst.chisel','w')
+    chisel_file.write(f'''
+/* Automatically generated by parse_opcodes */
+object Instructions {{
+{chisel_names}
+}}
+object Causes {{
+{cause_names_str}
+}}
+object CSRs {{
+{csr_names_str}
+}}
+''')
+    chisel_file.close()
diff --git a/go_utils.py b/go_utils.py
new file mode 100644
index 00000000..9c5ef2b1
--- /dev/null
+++ b/go_utils.py
@@ -0,0 +1,65 @@
+import re
+import glob
+import os
+import pprint
+import logging
+import collections
+import yaml
+import sys
+# from shared_utils import overlaps, overlap_allowed, extension_overlap_allowed, instruction_overlap_allowed, process_enc_line, same_base_isa, add_segmented_vls_insn, expand_nf_field
+from shared_utils import *
+
+pp = pprint.PrettyPrinter(indent=2)
+logging.basicConfig(level=logging.INFO, format='%(levelname)s:: %(message)s')
+
+def make_go(instr_dict):
+
+    args = " ".join(sys.argv)
+    prelude = f'''// Code generated by {args}; DO NOT EDIT.'''
+
+    prelude += '''
+package riscv
+
+import "cmd/internal/obj"
+
+type inst struct {
+	opcode uint32
+	funct3 uint32
+	rs1    uint32
+	rs2    uint32
+	csr    int64
+	funct7 uint32
+}
+
+func encode(a obj.As) *inst {
+	switch a {
+'''
+
+    endoffile = '''  }
+	return nil
+}
+'''
+
+    instr_str = ''
+    for i in instr_dict:
+        enc_match = int(instr_dict[i]['match'],0)
+        opcode = (enc_match >> 0) & ((1<<7)-1)
+        funct3 = (enc_match >> 12) & ((1<<3)-1)
+        rs1 = (enc_match >> 15) & ((1<<5)-1)
+        rs2 = (enc_match >> 20) & ((1<<5)-1)
+        csr = (enc_match >> 20) & ((1<<12)-1)
+        funct7 = (enc_match >> 25) & ((1<<7)-1)
+        instr_str += f'''  case A{i.upper().replace("_","")}:
+    return &inst{{ {hex(opcode)}, {hex(funct3)}, {hex(rs1)}, {hex(rs2)}, {signed(csr,12)}, {hex(funct7)} }}
+'''
+        
+    with open('inst.go','w') as file:
+        file.write(prelude)
+        file.write(instr_str)
+        file.write(endoffile)
+
+    try:
+        import subprocess
+        subprocess.run(["go", "fmt", "inst.go"])
+    except:
+        pass
\ No newline at end of file
diff --git a/latex_utils.py b/latex_utils.py
new file mode 100644
index 00000000..59a8bb52
--- /dev/null
+++ b/latex_utils.py
@@ -0,0 +1,435 @@
+#!/usr/bin/env python3
+import pprint
+import logging
+from constants import *
+from shared_utils import create_inst_dict
+
+LOG_FORMAT = '%(levelname)s:: %(message)s'
+LOG_LEVEL = logging.INFO
+
+pretty_printer = pprint.PrettyPrinter(indent=2)
+logging.basicConfig(level=LOG_LEVEL, format=LOG_FORMAT)
+
+
+def create_priv_instr_dataset():
+    """Create dataset list for privileged instructions."""
+    system_instr = ['_h', '_s', '_system', '_svinval', '64_h']
+    return [
+        (system_instr, 'Trap-Return Instructions', ['sret', 'mret'], False),
+        (system_instr, 'Interrupt-Management Instructions', ['wfi'], False),
+        (system_instr, 'Supervisor Memory-Management Instructions', ['sfence_vma'], False),
+        (system_instr, 'Hypervisor Memory-Management Instructions', ['hfence_vvma', 'hfence_gvma'], False),
+        (system_instr, 'Hypervisor Virtual-Machine Load and Store Instructions', 
+            ['hlv_b', 'hlv_bu', 'hlv_h', 'hlv_hu', 'hlv_w', 'hlvx_hu', 'hlvx_wu', 'hsv_b', 'hsv_h', 'hsv_w'], False),
+        (system_instr, 'Hypervisor Virtual-Machine Load and Store Instructions, RV64 only', ['hlv_wu', 'hlv_d', 'hsv_d'], False),
+        (system_instr, 'Svinval Memory-Management Instructions', ['sinval_vma', 'sfence_w_inval', 'sfence_inval_ir', 'hinval_vvma', 'hinval_gvma'], False)
+    ]
+
+
+def make_priv_latex_table():
+    """Generate and write the LaTeX table for privileged instructions."""
+    type_list = ['R-type', 'I-type']
+    dataset_list = create_priv_instr_dataset()
+    caption = '\\caption{RISC-V Privileged Instructions}'
+
+    with open('priv-instr-table.tex', 'w') as latex_file:
+        make_ext_latex_table(type_list, dataset_list, latex_file, 32, caption)
+
+
+def make_latex_table():
+    '''
+    - This function is mean to create the instr-table.tex that is meant to be used
+    by the riscv-isa-manual.
+        1. creates a single latex file of multiple table
+        2. Each table limited to a single page
+        3. Only the last table is assigned a latex-caption.
+        
+    - For each table, we assign a type-list that captures the different instruction types (R, I, B, etc.) required for that table.
+        1. Specify the type-list to capture various instruction types (e.g., R-type, I-type, B-type).
+        2. Select a list of extensions (e.g., _i, 32_i) whose instructions are necessary to populate the table.
+        3. For each extension or collection of extensions, assign a title that appears as a subheading within the table (these are inlined headings, not captions).
+
+    * All of the above information is collected/created and sent to
+    make_ext_latex_table function to dump out the latex contents into a file.
+
+    * The last table only has to be given a caption - as per the policy of the
+    riscv-isa-manual.
+    '''
+    # File for writing LaTeX content
+    with open('instr-table.tex', 'w') as latex_file:
+        # Prepare table configurations with type list, datasets, word size & caption
+        table_configurations = get_table_configurations()
+        
+        # Map each configuration from above with variables to pass as argumnet
+        for config in table_configurations:
+            # Unpack configuration dictionary into arguments for make_ext_latex_table
+            type_list = config['type_list']
+            datasets = config['datasets']
+            word_size = config['word_size']
+            caption = config['caption']
+            
+            # LaTeX table generation function
+            make_ext_latex_table(
+                type_list, 
+                datasets, 
+                latex_file, 
+                word_size, 
+                caption
+            )
+
+
+def get_table_configurations():
+    '''
+    Returns a list of table configurations, each specifying the type list, datasets,
+    word size, and caption for LaTeX table generation.
+    
+    Returns:
+        list: A list of dictionaries, each representing a table's configuration.
+    '''
+    return [
+        create_table_configuration(
+            type_list=['R-type', 'I-type', 'S-type', 'B-type', 'U-type', 'J-type'],
+            datasets=[
+                create_dataset(['_i', '32_i'], 'RV32I Base Instruction Set', [], False),
+                create_dataset(['_i'], '', ['fence_tso', 'pause'], True)
+            ],
+            word_size=32
+        ),
+        create_table_configuration(
+            type_list=['R-type', 'I-type', 'S-type'],
+            datasets=[
+                create_dataset(['64_i'], 'RV64I Base Instruction Set (in addition to RV32I)', [], False),
+                create_dataset(['_zifencei'], 'RV32/RV64 Zifencei Standard Extension', [], False),
+                create_dataset(['_zicsr'], 'RV32/RV64 Zicsr Standard Extension', [], False),
+                create_dataset(['_m', '32_m'], 'RV32M Standard Extension', [], False),
+                create_dataset(['64_m'], 'RV64M Standard Extension (in addition to RV32M)', [], False)
+            ],
+            word_size=32
+        ),
+        create_table_configuration(
+            type_list=['R-type'],
+            datasets=[
+                create_dataset(['_a'], 'RV32A Standard Extension', [], False),
+                create_dataset(['64_a'], 'RV64A Standard Extension (in addition to RV32A)', [], False)
+            ],
+            word_size=32
+        ),
+        create_table_configuration(
+            type_list=['R-type', 'R4-type', 'I-type', 'S-type'],
+            datasets=[
+                create_dataset(['_f'], 'RV32F Standard Extension', [], False),
+                create_dataset(['64_f'], 'RV64F Standard Extension (in addition to RV32F)', [], False)
+            ],
+            word_size=32
+        ),
+        create_table_configuration(
+            type_list=['R-type', 'R4-type', 'I-type', 'S-type'],
+            datasets=[
+                create_dataset(['_d'], 'RV32D Standard Extension', [], False),
+                create_dataset(['64_d'], 'RV64D Standard Extension (in addition to RV32D)', [], False)
+            ],
+            word_size=32
+        ),
+        create_table_configuration(
+            type_list=['R-type', 'R4-type', 'I-type', 'S-type'],
+            datasets=[
+                create_dataset(['_q'], 'RV32Q Standard Extension', [], False),
+                create_dataset(['64_q'], 'RV64Q Standard Extension (in addition to RV32Q)', [], False)
+            ],
+            word_size=32
+        ),
+        create_table_configuration(
+            type_list=['R-type', 'R4-type', 'I-type', 'S-type'],
+            datasets=[
+                create_dataset(['_zfh', '_d_zfh', '_q_zfh'], 'RV32Zfh Standard Extension', [], False),
+                create_dataset(['64_zfh'], 'RV64Zfh Standard Extension (in addition to RV32Zfh)', [], False)
+            ],
+            word_size=32,
+            caption='\\caption{Instruction listing for RISC-V}'
+        ),
+        create_table_configuration(
+            type_list=[''],
+            datasets=[
+                create_dataset(['_c', '32_c', '32_c_f', '_c_d'], 'RV32C Standard Extension', [], False),
+                create_dataset(['64_c'], 'RV64C Standard Extension (in addition to RV32C)', [], False)
+            ],
+            word_size=16,
+            caption=''
+        )
+    ]
+
+
+def create_table_configuration(type_list, datasets, word_size, caption=''):
+    '''
+    Creates a table configuration dictionary with the provided parameters.
+
+    Parameters:
+        type_list (list): List of instruction types to include in the table.
+        datasets (list of tuples): Each tuple contains:
+            - list_of_extensions (list): List of extension names.
+            - title (str): Title to appear as a subsection in the table.
+            - list_of_instructions (list): Specific instructions to include.
+            - include_pseudo_ops (bool): Whether to include pseudo-operations.
+        word_size (int): The word size for the instructions (32 or 16).
+        caption (str): The caption to include at the end of the table.
+
+    Returns:
+        dict: A dictionary representing the table configuration.
+    '''
+    return {
+        "type_list": type_list,
+        "datasets": datasets,
+        "word_size": word_size,
+        "caption": caption
+    }
+
+
+def create_dataset(extensions, title, instructions, include_pseudo_ops):
+    '''
+    Creates a dataset tuple for table configuration.
+
+    Parameters:
+        extensions (list): List of extension names.
+        title (str): Title for the dataset.
+        instructions (list): List of specific instructions to include.
+        include_pseudo_ops (bool): Whether to include pseudo-operations.
+
+    Returns:
+        tuple: A tuple representing the dataset configuration.
+    '''
+    return (extensions, title, instructions, include_pseudo_ops)
+
+
+def make_ext_latex_table(type_list, dataset, latex_file, ilen, caption):
+    '''
+    For a given collection of extensions this function dumps out a complete
+    latex table which includes the encodings of the instructions.
+
+    Args:
+    - type_list (list of str): 
+        1. A list of instruction types (R, I, B, etc) that are treated as header for each table. 
+        2. Each table will have its own requirements and type_list must include all the instruction-types that the table needs.
+        3. All elements of this list must be present in the latex_inst_type dictionary defined in constants.py
+    
+    
+    - dataset (list of tuples): A list of 3-element tuples where each tuple consists of:
+        1. list_of_extensions (list): A list of extensions whose instructions will be populated under the respective title.
+        2. title (str): A title associated with the respective table.
+        3. list_of_instructions (list): If not empty, only these instructions present in the corresponding extension 
+          will be included in the table, while others will be ignored.
+
+    - latex_file (file pointer): A file pointer to the LaTeX file where the generated table will be written.
+    
+    - ilen (int): The ilen input indicates the length of the instruction for which the table is created.
+    
+    - caption (str): The caption for the LaTeX table.
+
+    Returns:
+    - None: The function writes the generated LaTeX table directly to the provided `latex_file`.
+
+    Process:
+    1. Creates table headers based on the instruction types in `type_list` using the `latex_inst_type` dictionary 
+       from constants.py.
+       
+    2. Iterates through each entry in the dataset to:
+       - Generate an exhaustive list of instructions for each dataset using `create_inst_dict`.
+       - Apply any instruction filters based on `list_of_instructions` to select only relevant instructions.
+       
+    3. For each instruction, generates LaTeX table entries.
+       - Uses `arg_lut` from constants.py to determine the position of arguments in the encoding, and creates multicolumn 
+         LaTeX entries for these arguments.
+       - Handles hardcoded bits (e.g., strings of 1s and 0s) similarly, creating multicolumn entries for continuous 
+         strings of bits.
+
+    4. Writes the LaTeX table to `latex_file` with a specific format suitable for instructions of size `ilen`.
+    '''
+
+    column_size = get_column_size(ilen)
+    type_entries = generate_type_entries(ilen)
+    type_dict = get_type_dict(type_list)
+
+    # Build the table entry with each instruction types
+    for inst_type, fields in type_dict.items():
+        type_entries += build_instruction_type_entry(inst_type, fields, ilen)
+
+    # Create a table for each dataset entry
+    content = generate_dataset_content(dataset, ilen)
+
+    header = generate_table_header(column_size, ilen, type_entries)
+    endtable = generate_table_footer(caption)
+
+    # Dump the contents to the latex file
+    latex_file.write(header + content + endtable)
+
+
+def get_column_size(ilen):
+    """Generate the column size string based on instruction length (ilen)."""
+    return "".join(['p{0.002in}'] * (ilen + 1))
+
+
+def generate_type_entries(ilen):
+    """Generate the type entries section of the LaTeX table."""
+    if ilen == 32:
+        return '''
+            \\multicolumn{3}{l}{31} &
+            \\multicolumn{2}{r}{27} &
+            \\multicolumn{1}{c}{26} &
+            \\multicolumn{1}{r}{25} &
+            \\multicolumn{3}{l}{24} &
+            \\multicolumn{2}{r}{20} &
+            \\multicolumn{3}{l}{19} &
+            \\multicolumn{2}{r}{15} &
+            \\multicolumn{2}{l}{14} &
+            \\multicolumn{1}{r}{12} &
+            \\multicolumn{4}{l}{11} &
+            \\multicolumn{1}{r}{7} &
+            \\multicolumn{6}{l}{6} &
+            \\multicolumn{1}{r}{0} \\\\
+            \\cline{2-33}\n&\n\n'''
+    else:
+        return '''
+            \\multicolumn{1}{c}{15} &
+            \\multicolumn{1}{c}{14} &
+            \\multicolumn{1}{c}{13} &
+            \\multicolumn{1}{c}{12} &
+            \\multicolumn{1}{c}{11} &
+            \\multicolumn{1}{c}{10} &
+            \\multicolumn{1}{c}{9} &
+            \\multicolumn{1}{c}{8} &
+            \\multicolumn{1}{c}{7} &
+            \\multicolumn{1}{c}{6} &
+            \\multicolumn{1}{c}{5} &
+            \\multicolumn{1}{c}{4} &
+            \\multicolumn{1}{c}{3} &
+            \\multicolumn{1}{c}{2} &
+            \\multicolumn{1}{c}{1} &
+            \\multicolumn{1}{c}{0} \\\\
+            \\cline{2-17}\n&\n\n'''
+
+
+def get_type_dict(type_list):
+    """Create a subset dictionary of latex_inst_type for the given type_list."""
+    return {key: value for key, value in latex_inst_type.items() if key in type_list}
+
+
+def build_instruction_type_entry(inst_type, fields, ilen):
+    """Build a LaTeX table entry for each instruction type."""
+    entries = []
+    for field in fields['variable_fields']:
+        (msb, lsb) = arg_lut[field]
+        name = latex_mapping.get(field, field)
+        entries.append((msb, lsb, name))
+
+    return format_table_entry(entries, inst_type, ilen)
+
+
+def format_table_entry(fields, entry_type, ilen):
+    """Generate formatted LaTeX table entry."""
+    fields.sort(key=lambda f: f[0], reverse=True)
+    entry = ''
+    for i, (msb, lsb, name) in enumerate(fields):
+        col_size = msb - lsb + 1
+        if i == len(fields) - 1:
+            entry += f'\\multicolumn{{{col_size}}}{{|c|}}{{{name}}} & {entry_type} \\\\\n'
+        elif i == 0:
+            entry += f'\\multicolumn{{{col_size}}}{{|c|}}{{{name}}} &\n'
+        else:
+            entry += f'\\multicolumn{{{col_size}}}{{c|}}{{{name}}} &\n'
+    return entry + f'\\cline{{2-{ilen+1}}}\n&\n\n'
+
+
+def generate_dataset_content(dataset, ilen):
+    """Generate LaTeX content for each dataset entry."""
+    content = ''
+    for ext_list, title, filter_list, include_pseudo in dataset:
+        instr_dict = get_instruction_dict(ext_list, include_pseudo)
+        filtered_list = filter_list if filter_list else list(instr_dict.keys())
+        instr_entries = generate_instruction_entries(instr_dict, filtered_list, ilen)
+
+        if title:
+            content += generate_dataset_title(title, ilen) + instr_entries
+        else:
+            content += instr_entries
+    return content
+
+
+def get_instruction_dict(ext_list, include_pseudo):
+    """Create a dictionary of instructions for given extensions."""
+    instr_dict = {}
+    for ext in ext_list:
+        instr_dict.update(create_inst_dict([f'rv{ext}'], include_pseudo))
+    return instr_dict
+
+
+def generate_instruction_entries(instr_dict, inst_list, ilen):
+    """Generate LaTeX entries for each instruction in the list."""
+    instr_entries = ''
+    for inst in inst_list:
+        if inst not in instr_dict:
+            logging.error(f'Instruction {inst} not found in instr_dict')
+            raise SystemExit(1)
+
+        fields = parse_instruction_fields(instr_dict[inst], ilen)
+        instr_entries += format_table_entry(fields, inst.upper().replace("_", "."), ilen)
+
+    return instr_entries
+
+
+def parse_instruction_fields(inst_data, ilen):
+    """Parse and extract fields from instruction data."""
+    fields = []
+    encoding = inst_data['encoding'][16:] if ilen == 16 else inst_data['encoding']
+    msb = ilen - 1
+    y = ''
+
+    for i in range(ilen):
+        x = encoding[i]
+        if x == '-':
+            if y:
+                fields.append((msb, ilen - i, y))
+                y = ''
+            msb -= 1
+        else:
+            y += str(x)
+
+        if i == ilen - 1 and y:
+            fields.append((msb, 0, y))
+
+    fields.sort(key=lambda f: f[0], reverse=True)
+    return fields
+
+
+def generate_dataset_title(title, ilen):
+    """Generate LaTeX dataset title."""
+    return f'''
+\\multicolumn{{{ilen}}}{{c}}{{}} & \\\\
+\\multicolumn{{{ilen}}}{{c}}{{\\bf {title} }} & \\\\
+\\cline{{2-{ilen + 1}}}
+'''
+
+def generate_table_header(column_size, ilen, type_entries):
+    """Generate LaTeX table header."""
+    return f'''
+\\newpage
+
+\\begin{{table}}[p]
+\\begin{{small}}
+\\begin{{center}}
+    \\begin{{tabular}} {{{column_size}l}}
+    {" ".join(['&'] * ilen)} \\\\
+
+            &
+{type_entries}
+'''
+
+
+def generate_table_footer(caption):
+    """Generate LaTeX table footer."""
+    return f'''
+
+\\end{{tabular}}
+\\end{{center}}
+\\end{{small}}
+{caption}
+\\end{{table}}
+'''
diff --git a/parse.py b/parse.py
index fb0c2e70..586cd66e 100755
--- a/parse.py
+++ b/parse.py
@@ -1,1093 +1,113 @@
 #!/usr/bin/env python3
-
-from constants import *
-import copy
-import re
-import glob
-import os
-import pprint
-import logging
 import collections
-import yaml
+import logging
 import sys
+import yaml
+import pprint
 
-pp = pprint.PrettyPrinter(indent=2)
-logging.basicConfig(level=logging.INFO, format='%(levelname)s:: %(message)s')
-
-def process_enc_line(line, ext):
-    '''
-    This function processes each line of the encoding files (rv*). As part of
-    the processing, the function ensures that the encoding is legal through the
-    following checks::
-
-        - there is no over specification (same bits assigned different values)
-        - there is no under specification (some bits not assigned values)
-        - bit ranges are in the format hi..lo=val where hi > lo
-        - value assigned is representable in the bit range
-        - also checks that the mapping of arguments of an instruction exists in
-          arg_lut.
-
-    If the above checks pass, then the function returns a tuple of the name and
-    a dictionary containing basic information of the instruction which includes:
-        - variables: list of arguments used by the instruction whose mapping
-          exists in the arg_lut dictionary
-        - encoding: this contains the 32-bit encoding of the instruction where
-          '-' is used to represent position of arguments and 1/0 is used to
-          reprsent the static encoding of the bits
-        - extension: this field contains the rv* filename from which this
-          instruction was included
-        - match: hex value representing the bits that need to match to detect
-          this instruction
-        - mask: hex value representin the bits that need to be masked to extract
-          the value required for matching.
-    '''
-    single_dict = {}
-
-    # fill all bits with don't care. we use '-' to represent don't care
-    # TODO: hardcoded for 32-bits.
-    encoding = ['-'] * 32
-
-    # get the name of instruction by splitting based on the first space
-    [name, remaining] = line.split(' ', 1)
-
-    # replace dots with underscores as dot doesn't work with C/Sverilog, etc
-    name = name.replace('.', '_')
-
-    # remove leading whitespaces
-    remaining = remaining.lstrip()
-
-    # check each field for it's length and overlapping bits
-    # ex: 1..0=5 will result in an error --> x<y
-    # ex: 5..0=0 2..1=2 --> overlapping bits
-    for (s2, s1, entry) in fixed_ranges.findall(remaining):
-        msb = int(s2)
-        lsb = int(s1)
-
-        # check msb < lsb
-        if msb < lsb:
-            logging.error(
-                f'{line.split(" ")[0]:<10} has position {msb} less than position {lsb} in it\'s encoding'
-            )
-            raise SystemExit(1)
-
-        # illegal value assigned as per bit width
-        entry_value = int(entry, 0)
-        if entry_value >= (1 << (msb - lsb + 1)):
-            logging.error(
-                f'{line.split(" ")[0]:<10} has an illegal value {entry_value} assigned as per the bit width {msb - lsb}'
-            )
-            raise SystemExit(1)
-
-        for ind in range(lsb, msb + 1):
-            # overlapping bits
-            if encoding[31 - ind] != '-':
-                logging.error(
-                    f'{line.split(" ")[0]:<10} has {ind} bit overlapping in it\'s opcodes'
-                )
-                raise SystemExit(1)
-            bit = str((entry_value >> (ind - lsb)) & 1)
-            encoding[31 - ind] = bit
-
-    # extract bit pattern assignments of the form hi..lo=val
-    remaining = fixed_ranges.sub(' ', remaining)
-
-    # do the same as above but for <lsb>=<val> pattern. single_fixed is a regex
-    # expression present in constants.py
-    for (lsb, value, drop) in single_fixed.findall(remaining):
-        lsb = int(lsb, 0)
-        value = int(value, 0)
-        if encoding[31 - lsb] != '-':
-            logging.error(
-                f'{line.split(" ")[0]:<10} has {lsb} bit overlapping in it\'s opcodes'
-            )
-            raise SystemExit(1)
-        encoding[31 - lsb] = str(value)
-
-    # convert the list of encodings into a single string for match and mask
-    match = "".join(encoding).replace('-','0')
-    mask = "".join(encoding).replace('0','1').replace('-','0')
-
-    # check if all args of the instruction are present in arg_lut present in
-    # constants.py
-    args = single_fixed.sub(' ', remaining).split()
-    encoding_args = encoding.copy()
-    for a in args:
-        if a not in arg_lut:
-            if len(parts := a.split('=')) == 2:
-                existing_arg, new_arg = parts
-                if existing_arg in arg_lut:
-                    arg_lut[a] = arg_lut[existing_arg]
-                
-                else:
-                    logging.error(f' Found field {existing_arg} in variable {a} in instruction {name} whose mapping in arg_lut does not exist')
-                    raise SystemExit(1)
-            else:
-                logging.error(f' Found variable {a} in instruction {name} whose mapping in arg_lut does not exist')
-                raise SystemExit(1)
-        (msb, lsb) = arg_lut[a]
-        for ind in range(lsb, msb + 1):
-            # overlapping bits
-            if encoding_args[31 - ind] != '-':
-                logging.error(f' Found variable {a} in instruction {name} overlapping {encoding_args[31 - ind]} variable in bit {ind}')
-                raise SystemExit(1)
-            encoding_args[31 - ind] = a
-
-
-    # update the fields of the instruction as a dict and return back along with
-    # the name of the instruction
-    single_dict['encoding'] = "".join(encoding)
-    single_dict['variable_fields'] = args
-    single_dict['extension'] = [os.path.basename(ext)]
-    single_dict['match']=hex(int(match,2))
-    single_dict['mask']=hex(int(mask,2))
-
-    return (name, single_dict)
-
-def same_base_isa(ext_name, ext_name_list):
-    type1 = ext_name.split("_")[0]
-    for ext_name1 in ext_name_list:
-        type2 = ext_name1.split("_")[0]
-        # "rv" mean insn for rv32 and rv64
-        if (type1 == type2 or
-            (type2 == "rv" and (type1 == "rv32" or type1 == "rv64")) or
-            (type1 == "rv" and (type2 == "rv32" or type2 == "rv64"))):
-            return True
-    return False
-
-def overlaps(x, y):
-    x = x.rjust(len(y), '-')
-    y = y.rjust(len(x), '-')
-
-    for i in range(0, len(x)):
-        if not (x[i] == '-' or y[i] == '-' or x[i] == y[i]):
-            return False
-
-    return True
-
-def overlap_allowed(a, x, y):
-    return x in a and y in a[x] or \
-           y in a and x in a[y]
-
-def extension_overlap_allowed(x, y):
-    return overlap_allowed(overlapping_extensions, x, y)
-
-def instruction_overlap_allowed(x, y):
-    return overlap_allowed(overlapping_instructions, x, y)
-
-def add_segmented_vls_insn(instr_dict):
-    updated_dict = {}
-    for k, v in instr_dict.items():
-        if "nf" in v['variable_fields']:
-            for new_key, new_value in expand_nf_field(k,v):
-                updated_dict[new_key] = new_value
-        else:
-            updated_dict[k] = v
-    return updated_dict
-
-def expand_nf_field(name, single_dict):
-    if "nf" not in single_dict['variable_fields']:
-        logging.error(f"Cannot expand nf field for instruction {name}")
-        raise SystemExit(1)
-
-    # nf no longer a variable field
-    single_dict['variable_fields'].remove("nf")
-    # include nf in mask
-    single_dict['mask'] = hex(int(single_dict['mask'],16) | 0b111 << 29)
-
-    name_expand_index = name.find('e')
-    expanded_instructions = []
-    for nf in range(0,8):
-        new_single_dict = copy.deepcopy(single_dict)
-        new_single_dict['match'] = hex(int(single_dict['match'],16) | nf << 29)
-        new_single_dict['encoding'] = format(nf, '03b') + single_dict['encoding'][3:]
-        new_name = name if nf == 0 else name[:name_expand_index] + "seg" + str(nf+1) + name[name_expand_index:]
-        expanded_instructions.append((new_name, new_single_dict))
-    return expanded_instructions
-
-
-def create_inst_dict(file_filter, include_pseudo=False, include_pseudo_ops=[]):
-    '''
-    This function return a dictionary containing all instructions associated
-    with an extension defined by the file_filter input. The file_filter input
-    needs to be rv* file name with out the 'rv' prefix i.e. '_i', '32_i', etc.
-
-    Each node of the dictionary will correspond to an instruction which again is
-    a dictionary. The dictionary contents of each instruction includes:
-        - variables: list of arguments used by the instruction whose mapping
-          exists in the arg_lut dictionary
-        - encoding: this contains the 32-bit encoding of the instruction where
-          '-' is used to represent position of arguments and 1/0 is used to
-          reprsent the static encoding of the bits
-        - extension: this field contains the rv* filename from which this
-          instruction was included
-        - match: hex value representing the bits that need to match to detect
-          this instruction
-        - mask: hex value representin the bits that need to be masked to extract
-          the value required for matching.
-
-    In order to build this dictionary, the function does 2 passes over the same
-    rv<file_filter> file. The first pass is to extract all standard
-    instructions. In this pass, all pseudo ops and imported instructions are
-    skipped. For each selected line of the file, we call process_enc_line
-    function to create the above mentioned dictionary contents of the
-    instruction. Checks are performed in this function to ensure that the same
-    instruction is not added twice to the overall dictionary.
-
-    In the second pass, this function parses only pseudo_ops. For each pseudo_op
-    this function checks if the dependent extension and instruction, both, exist
-    before parsing it. The pseudo op is only added to the overall dictionary if
-    the dependent instruction is not present in the dictionary, else it is
-    skipped.
-
-
-    '''
-    opcodes_dir = os.path.dirname(os.path.realpath(__file__))
-    instr_dict = {}
-
-    # file_names contains all files to be parsed in the riscv-opcodes directory
-    file_names = []
-    for fil in file_filter:
-        file_names += glob.glob(f'{opcodes_dir}/{fil}')
-    file_names.sort(reverse=True)
-    # first pass if for standard/regular instructions
-    logging.debug('Collecting standard instructions first')
-    for f in file_names:
-        logging.debug(f'Parsing File: {f} for standard instructions')
-        with open(f) as fp:
-            lines = (line.rstrip()
-                     for line in fp)  # All lines including the blank ones
-            lines = list(line for line in lines if line)  # Non-blank lines
-            lines = list(
-                line for line in lines
-                if not line.startswith("#"))  # remove comment lines
-
-        # go through each line of the file
-        for line in lines:
-            # if the an instruction needs to be imported then go to the
-            # respective file and pick the line that has the instruction.
-            # The variable 'line' will now point to the new line from the
-            # imported file
-
-            # ignore all lines starting with $import and $pseudo
-            if '$import' in line or '$pseudo' in line:
-                continue
-            logging.debug(f'     Processing line: {line}')
-
-            # call process_enc_line to get the data about the current
-            # instruction
-            (name, single_dict) = process_enc_line(line, f)
-            ext_name = os.path.basename(f)
-
-            # if an instruction has already been added to the filtered
-            # instruction dictionary throw an error saying the given
-            # instruction is already imported and raise SystemExit
-            if name in instr_dict:
-                var = instr_dict[name]["extension"]
-                if same_base_isa(ext_name, var):
-                    # disable same names on the same base ISA
-                    err_msg = f'instruction : {name} from '
-                    err_msg += f'{ext_name} is already '
-                    err_msg += f'added from {var} in same base ISA'
-                    logging.error(err_msg)
-                    raise SystemExit(1)
-                elif instr_dict[name]['encoding'] != single_dict['encoding']:
-                    # disable same names with different encodings on different base ISAs
-                    err_msg = f'instruction : {name} from '
-                    err_msg += f'{ext_name} is already '
-                    err_msg += f'added from {var} but each have different encodings in different base ISAs'
-                    logging.error(err_msg)
-                    raise SystemExit(1)
-                instr_dict[name]['extension'].extend(single_dict['extension'])
-            else:
-              for key in instr_dict:
-                  item = instr_dict[key]
-                  if overlaps(item['encoding'], single_dict['encoding']) and \
-                    not extension_overlap_allowed(ext_name, item['extension'][0]) and \
-                    not instruction_overlap_allowed(name, key) and \
-                    same_base_isa(ext_name, item['extension']):
-                      # disable different names with overlapping encodings on the same base ISA
-                      err_msg = f'instruction : {name} in extension '
-                      err_msg += f'{ext_name} overlaps instruction {key} '
-                      err_msg += f'in extension {item["extension"]}'
-                      logging.error(err_msg)
-                      raise SystemExit(1)
-
-            if name not in instr_dict:
-                # update the final dict with the instruction
-                instr_dict[name] = single_dict
-
-    # second pass if for pseudo instructions
-    logging.debug('Collecting pseudo instructions now')
-    for f in file_names:
-        logging.debug(f'Parsing File: {f} for pseudo_ops')
-        with open(f) as fp:
-            lines = (line.rstrip()
-                     for line in fp)  # All lines including the blank ones
-            lines = list(line for line in lines if line)  # Non-blank lines
-            lines = list(
-                line for line in lines
-                if not line.startswith("#"))  # remove comment lines
-
-        # go through each line of the file
-        for line in lines:
-
-            # ignore all lines not starting with $pseudo
-            if '$pseudo' not in line:
-                continue
-            logging.debug(f'     Processing line: {line}')
-
-            # use the regex pseudo_regex from constants.py to find the dependent
-            # extension, dependent instruction, the pseudo_op in question and
-            # its encoding
-            (ext, orig_inst, pseudo_inst, line) = pseudo_regex.findall(line)[0]
-            ext_file = f'{opcodes_dir}/{ext}'
-
-            # check if the file of the dependent extension exist. Throw error if
-            # it doesn't
-            if not os.path.exists(ext_file):
-                ext1_file = f'{opcodes_dir}/unratified/{ext}'
-                if not os.path.exists(ext1_file):
-                    logging.error(f'Pseudo op {pseudo_inst} in {f} depends on {ext} which is not available')
-                    raise SystemExit(1)
-                else:
-                    ext_file = ext1_file
-
-            # check if the dependent instruction exist in the dependent
-            # extension. Else throw error.
-            found = False
-            for oline in open(ext_file):
-                if not re.findall(f'^\\s*{orig_inst}\\s+',oline):
-                    continue
-                else:
-                    found = True
-                    break
-            if not found:
-                logging.error(f'Orig instruction {orig_inst} not found in {ext}. Required by pseudo_op {pseudo_inst} present in {f}')
-                raise SystemExit(1)
-
-
-            (name, single_dict) = process_enc_line(pseudo_inst + ' ' + line, f)
-            # add the pseudo_op to the dictionary only if the original
-            # instruction is not already in the dictionary.
-            if orig_inst.replace('.','_') not in instr_dict \
-                    or include_pseudo \
-                    or name in include_pseudo_ops:
-
-                # update the final dict with the instruction
-                if name not in instr_dict:
-                    instr_dict[name] = single_dict
-                    logging.debug(f'        including pseudo_ops:{name}')
-                else:
-                    if(single_dict['match'] != instr_dict[name]['match']):
-                        instr_dict[name + '_pseudo'] = single_dict
-
-                    # if a pseudo instruction has already been added to the filtered
-                    # instruction dictionary but the extension is not in the current
-                    # list, add it
-                    else:
-                        ext_name = single_dict['extension']
-
-                    if (ext_name not in instr_dict[name]['extension']) & (name + '_pseudo' not in instr_dict):
-                        instr_dict[name]['extension'].extend(ext_name)
-            else:
-                logging.debug(f'        Skipping pseudo_op {pseudo_inst} since original instruction {orig_inst} already selected in list')
-
-    # third pass if for imported instructions
-    logging.debug('Collecting imported instructions')
-    for f in file_names:
-        logging.debug(f'Parsing File: {f} for imported ops')
-        with open(f) as fp:
-            lines = (line.rstrip()
-                     for line in fp)  # All lines including the blank ones
-            lines = list(line for line in lines if line)  # Non-blank lines
-            lines = list(
-                line for line in lines
-                if not line.startswith("#"))  # remove comment lines
-
-        # go through each line of the file
-        for line in lines:
-            # if the an instruction needs to be imported then go to the
-            # respective file and pick the line that has the instruction.
-            # The variable 'line' will now point to the new line from the
-            # imported file
-
-            # ignore all lines starting with $import and $pseudo
-            if '$import' not in line :
-                continue
-            logging.debug(f'     Processing line: {line}')
-
-            (import_ext, reg_instr) = imported_regex.findall(line)[0]
-            import_ext_file = f'{opcodes_dir}/{import_ext}'
-
-            # check if the file of the dependent extension exist. Throw error if
-            # it doesn't
-            if not os.path.exists(import_ext_file):
-                ext1_file = f'{opcodes_dir}/unratified/{import_ext}'
-                if not os.path.exists(ext1_file):
-                    logging.error(f'Instruction {reg_instr} in {f} cannot be imported from {import_ext}')
-                    raise SystemExit(1)
-                else:
-                    ext_file = ext1_file
-            else:
-                ext_file = import_ext_file
-
-            # check if the dependent instruction exist in the dependent
-            # extension. Else throw error.
-            found = False
-            for oline in open(ext_file):
-                if not re.findall(f'^\\s*{reg_instr}\\s+',oline):
-                    continue
-                else:
-                    found = True
-                    break
-            if not found:
-                logging.error(f'imported instruction {reg_instr} not found in {ext_file}. Required by {line} present in {f}')
-                logging.error(f'Note: you cannot import pseudo/imported ops.')
-                raise SystemExit(1)
-
-            # call process_enc_line to get the data about the current
-            # instruction
-            (name, single_dict) = process_enc_line(oline, f)
-
-            # if an instruction has already been added to the filtered
-            # instruction dictionary throw an error saying the given
-            # instruction is already imported and raise SystemExit
-            if name in instr_dict:
-                var = instr_dict[name]["extension"]
-                if instr_dict[name]['encoding'] != single_dict['encoding']:
-                    err_msg = f'imported instruction : {name} in '
-                    err_msg += f'{os.path.basename(f)} is already '
-                    err_msg += f'added from {var} but each have different encodings for the same instruction'
-                    logging.error(err_msg)
-                    raise SystemExit(1)
-                instr_dict[name]['extension'].extend(single_dict['extension'])
-            else:
-                # update the final dict with the instruction
-                instr_dict[name] = single_dict
-    return instr_dict
-
-def make_priv_latex_table():
-    latex_file = open('priv-instr-table.tex','w')
-    type_list = ['R-type','I-type']
-    system_instr = ['_h','_s','_system','_svinval', '64_h']
-    dataset_list = [ (system_instr, 'Trap-Return Instructions',['sret','mret'], False) ]
-    dataset_list.append((system_instr, 'Interrupt-Management Instructions',['wfi'], False))
-    dataset_list.append((system_instr, 'Supervisor Memory-Management Instructions',['sfence_vma'], False))
-    dataset_list.append((system_instr, 'Hypervisor Memory-Management Instructions',['hfence_vvma', 'hfence_gvma'], False))
-    dataset_list.append((system_instr, 'Hypervisor Virtual-Machine Load and Store Instructions',
-        ['hlv_b','hlv_bu', 'hlv_h','hlv_hu', 'hlv_w', 'hlvx_hu', 'hlvx_wu', 'hsv_b', 'hsv_h','hsv_w'], False))
-    dataset_list.append((system_instr, 'Hypervisor Virtual-Machine Load and Store Instructions, RV64 only', ['hlv_wu','hlv_d','hsv_d'], False))
-    dataset_list.append((system_instr, 'Svinval Memory-Management Instructions', ['sinval_vma', 'sfence_w_inval','sfence_inval_ir', 'hinval_vvma','hinval_gvma'], False))
-    caption = '\\caption{RISC-V Privileged Instructions}'
-    make_ext_latex_table(type_list, dataset_list, latex_file, 32, caption)
-
-    latex_file.close()
-
-def make_latex_table():
-    '''
-    This function is mean to create the instr-table.tex that is meant to be used
-    by the riscv-isa-manual. This function basically creates a single latext
-    file of multiple tables with each table limited to a single page. Only the
-    last table is assigned a latex-caption.
-
-    For each table we assign a type-list which capture the different instruction
-    types (R, I, B, etc) that will be required for the table. Then we select the
-    list of extensions ('_i, '32_i', etc) whose instructions are required to
-    populate the table. For each extension or collection of extension we can
-    assign Title, such that in the end they appear as subheadings within
-    the table (note these are inlined headings and not captions of the table).
-
-    All of the above information is collected/created and sent to
-    make_ext_latex_table function to dump out the latex contents into a file.
-
-    The last table only has to be given a caption - as per the policy of the
-    riscv-isa-manual.
-    '''
-    # open the file and use it as a pointer for all further dumps
-    latex_file = open('instr-table.tex','w')
-
-    # create the rv32i table first. Here we set the caption to empty. We use the
-    # files rv_i and rv32_i to capture instructions relevant for rv32i
-    # configuration. The dataset is a list of 4-element tuples :
-    # (list_of_extensions, title, list_of_instructions, include_pseudo_ops). If list_of_instructions
-    # is empty then it indicates that all instructions of the all the extensions
-    # in list_of_extensions need to be dumped. If not empty, then only the
-    # instructions listed in list_of_instructions will be dumped into latex.
-    caption = ''
-    type_list = ['R-type','I-type','S-type','B-type','U-type','J-type']
-    dataset_list = [(['_i','32_i'], 'RV32I Base Instruction Set', [], False)]
-    dataset_list.append((['_i'], '', ['fence_tso','pause'], True))
-    make_ext_latex_table(type_list, dataset_list, latex_file, 32, caption)
-
-    type_list = ['R-type','I-type','S-type']
-    dataset_list = [(['64_i'], 'RV64I Base Instruction Set (in addition to RV32I)', [], False)]
-    dataset_list.append((['_zifencei'], 'RV32/RV64 Zifencei Standard Extension', [], False))
-    dataset_list.append((['_zicsr'], 'RV32/RV64 Zicsr Standard Extension', [], False))
-    dataset_list.append((['_m','32_m'], 'RV32M Standard Extension', [], False))
-    dataset_list.append((['64_m'],'RV64M Standard Extension (in addition to RV32M)', [], False))
-    make_ext_latex_table(type_list, dataset_list, latex_file, 32, caption)
-
-    type_list = ['R-type']
-    dataset_list = [(['_a'],'RV32A Standard Extension', [], False)]
-    dataset_list.append((['64_a'],'RV64A Standard Extension (in addition to RV32A)', [], False))
-    make_ext_latex_table(type_list, dataset_list, latex_file, 32, caption)
-
-    type_list = ['R-type','R4-type','I-type','S-type']
-    dataset_list = [(['_f'],'RV32F Standard Extension', [], False)]
-    dataset_list.append((['64_f'],'RV64F Standard Extension (in addition to RV32F)', [], False))
-    make_ext_latex_table(type_list, dataset_list, latex_file, 32, caption)
-
-    type_list = ['R-type','R4-type','I-type','S-type']
-    dataset_list = [(['_d'],'RV32D Standard Extension', [], False)]
-    dataset_list.append((['64_d'],'RV64D Standard Extension (in addition to RV32D)', [], False))
-    make_ext_latex_table(type_list, dataset_list, latex_file, 32, caption)
-
-    type_list = ['R-type','R4-type','I-type','S-type']
-    dataset_list = [(['_q'],'RV32Q Standard Extension', [], False)]
-    dataset_list.append((['64_q'],'RV64Q Standard Extension (in addition to RV32Q)', [], False))
-    make_ext_latex_table(type_list, dataset_list, latex_file, 32, caption)
-
-    caption = '\\caption{Instruction listing for RISC-V}'
-    type_list = ['R-type','R4-type','I-type','S-type']
-    dataset_list = [(['_zfh', '_d_zfh','_q_zfh'],'RV32Zfh Standard Extension', [], False)]
-    dataset_list.append((['64_zfh'],'RV64Zfh Standard Extension (in addition to RV32Zfh)', [], False))
-    make_ext_latex_table(type_list, dataset_list, latex_file, 32, caption)
-
-    ## The following is demo to show that Compressed instructions can also be
-    # dumped in the same manner as above
-
-    #type_list = ['']
-    #dataset_list = [(['_c', '32_c', '32_c_f','_c_d'],'RV32C Standard Extension', [])]
-    #dataset_list.append((['64_c'],'RV64C Standard Extension (in addition to RV32C)', []))
-    #make_ext_latex_table(type_list, dataset_list, latex_file, 16, caption)
-
-    latex_file.close()
-
-def make_ext_latex_table(type_list, dataset, latex_file, ilen, caption):
-    '''
-    For a given collection of extensions this function dumps out a complete
-    latex table which includes the encodings of the instructions.
-
-    The ilen input indicates the length of the instruction for which the table
-    is created.
-
-    The caption input is used to create the latex-table caption.
-
-    The type_list input is a list of instruction types (R, I, B, etc) that are
-    treated as header for each table. Each table will have its own requirements
-    and type_list must include all the instruction-types that the table needs.
-    Note, all elements of this list must be present in the latex_inst_type
-    dictionary defined in constants.py
-
-    The latex_file is a file pointer to which the latex-table will dumped into
-
-    The dataset is a list of 3-element tuples containing:
-        (list_of_extensions, title, list_of_instructions)
-    The list_of_extensions must contain all the set of extensions whose
-    instructions must be populated under a given title. If list_of_instructions
-    is not empty, then only those instructions mentioned in list_of_instructions
-    present in the extension will be dumped into the latex-table, other
-    instructions will be ignored.
-
-    Once the above inputs are received then function first creates table entries
-    for the instruction types. To simplify things, we maintain a dictionary
-    called latex_inst_type in constants.py which is created in the same way the
-    instruction dictionary is created. This allows us to re-use the same logic
-    to create the instruction types table as well
-
-    Once the header is created, we then parse through every entry in the
-    dataset. For each list dataset entry we use the create_inst_dict function to
-    create an exhaustive list of instructions associated with the respective
-    collection of the extension of that dataset. Then we apply the instruction
-    filter, if any, indicated by the list_of_instructions of that dataset.
-    Thereon, for each instruction we create a latex table entry.
-
-    Latex table specification for ilen sized instructions:
-        Each table is created with ilen+1 columns - ilen columns for each bit of the
-        instruction and one column to hold the name of the instruction.
-
-        For each argument of an instruction we use the arg_lut from constants.py
-        to identify its position in the encoding, and thus create a multicolumn
-        entry with the name of the argument as the data. For hardcoded bits, we
-        do the same where we capture a string of continuous 1s and 0s, identify
-        the position and assign the same string as the data of the
-        multicolumn entry in the table.
-
-    '''
-    column_size = "".join(['p{0.002in}']*(ilen+1))
-
-    type_entries = '''
-    \\multicolumn{3}{l}{31} &
-    \\multicolumn{2}{r}{27} &
-    \\multicolumn{1}{c}{26} &
-    \\multicolumn{1}{r}{25} &
-    \\multicolumn{3}{l}{24} &
-    \\multicolumn{2}{r}{20} &
-    \\multicolumn{3}{l}{19} &
-    \\multicolumn{2}{r}{15} &
-    \\multicolumn{2}{l}{14} &
-    \\multicolumn{1}{r}{12} &
-    \\multicolumn{4}{l}{11} &
-    \\multicolumn{1}{r}{7} &
-    \\multicolumn{6}{l}{6} &
-    \\multicolumn{1}{r}{0} \\\\
-    \\cline{2-33}\n&\n\n
-''' if ilen == 32 else '''
-    \\multicolumn{1}{c}{15} &
-    \\multicolumn{1}{c}{14} &
-    \\multicolumn{1}{c}{13} &
-    \\multicolumn{1}{c}{12} &
-    \\multicolumn{1}{c}{11} &
-    \\multicolumn{1}{c}{10} &
-    \\multicolumn{1}{c}{9} &
-    \\multicolumn{1}{c}{8} &
-    \\multicolumn{1}{c}{7} &
-    \\multicolumn{1}{c}{6} &
-    \\multicolumn{1}{c}{5} &
-    \\multicolumn{1}{c}{4} &
-    \\multicolumn{1}{c}{3} &
-    \\multicolumn{1}{c}{2} &
-    \\multicolumn{1}{c}{1} &
-    \\multicolumn{1}{c}{0} \\\\
-    \\cline{2-17}\n&\n\n
-'''
-
-    # depending on the type_list input we create a subset dictionary of
-    # latex_inst_type dictionary present in constants.py
-    type_dict = {key: value for key, value in latex_inst_type.items() if key in type_list}
-
-    # iterate ovr each instruction type and create a table entry
-    for t in type_dict:
-        fields = []
-
-        # first capture all "arguments" of the type (funct3, funct7, rd, etc)
-        # and capture their positions using arg_lut.
-        for f in type_dict[t]['variable_fields']:
-            (msb, lsb) = arg_lut[f]
-            name = f if f not in latex_mapping else latex_mapping[f]
-            fields.append((msb, lsb, name))
-
-        # iterate through the 32 bits, starting from the msb, and assign
-        # argument names to the relevant portions of the instructions. This
-        # information is stored as a 3-element tuple containing the msb, lsb
-        # position of the arugment and the name of the argument.
-        msb = ilen - 1
-        y = ''
-        for r in range(0,ilen):
-            if y != '':
-                fields.append((msb,ilen-1-r+1,y))
-                y = ''
-            msb = ilen-1-r-1
-            if r == 31:
-                if y != '':
-                    fields.append((msb, 0, y))
-                y = ''
-
-        # sort the arguments in decreasing order of msb position
-        fields.sort(key=lambda y: y[0], reverse=True)
-
-        # for each argument/string of 1s or 0s, create a multicolumn latex table
-        # entry
-        entry = ''
-        for r in range(len(fields)):
-            (msb, lsb, name) = fields[r]
-            if r == len(fields)-1:
-                entry += f'\\multicolumn{{{msb - lsb + 1}}}{{|c|}}{{{name}}} & {t} \\\\\n'
-            elif r == 0:
-                entry += f'\\multicolumn{{{msb - lsb + 1}}}{{|c|}}{{{name}}} &\n'
-            else:
-                entry += f'\\multicolumn{{{msb - lsb + 1}}}{{c|}}{{{name}}} &\n'
-        entry += f'\\cline{{2-{ilen+1}}}\n&\n\n'
-        type_entries += entry
-
-    # for each entry in the dataset create a table
-    content = ''
-    for (ext_list, title, filter_list, include_pseudo) in dataset:
-        instr_dict = {}
-
-        # for all extensions list in ext_list, create a dictionary of
-        # instructions associated with those extensions.
-        for e in ext_list:
-            instr_dict.update(create_inst_dict(['rv'+e], include_pseudo))
-
-        # if filter_list is not empty then use that as the official set of
-        # instructions that need to be dumped into the latex table
-        inst_list = list(instr_dict.keys()) if not filter_list else filter_list
-
-        # for each instruction create an latex table entry just like how we did
-        # above with the instruction-type table.
-        instr_entries = ''
-        for inst in inst_list:
-            if inst not in instr_dict:
-                logging.error(f'in make_ext_latex_table: Instruction: {inst} not found in instr_dict')
-                raise SystemExit(1)
-            fields = []
-
-            # only if the argument is available in arg_lut we consume it, else
-            # throw error.
-            for f in instr_dict[inst]['variable_fields']:
-                if f not in arg_lut:
-                    logging.error(f'Found variable {f} in instruction {inst} whose mapping is not available')
-                    raise SystemExit(1)
-                (msb,lsb) = arg_lut[f]
-                name = f.replace('_','.') if f not in latex_mapping else latex_mapping[f]
-                fields.append((msb, lsb, name))
-
-            msb = ilen -1
-            y = ''
-            if ilen == 16:
-                encoding = instr_dict[inst]['encoding'][16:]
-            else:
-                encoding = instr_dict[inst]['encoding']
-            for r in range(0,ilen):
-                x = encoding [r]
-                if ((msb, ilen-1-r+1)) in latex_fixed_fields:
-                    fields.append((msb,ilen-1-r+1,y))
-                    msb = ilen-1-r
-                    y = ''
-                if x == '-':
-                    if y != '':
-                        fields.append((msb,ilen-1-r+1,y))
-                        y = ''
-                    msb = ilen-1-r-1
-                else:
-                    y += str(x)
-                if r == ilen-1:
-                    if y != '':
-                        fields.append((msb, 0, y))
-                    y = ''
-
-            fields.sort(key=lambda y: y[0], reverse=True)
-            entry = ''
-            for r in range(len(fields)):
-                (msb, lsb, name) = fields[r]
-                if r == len(fields)-1:
-                    entry += f'\\multicolumn{{{msb - lsb + 1}}}{{|c|}}{{{name}}} & {inst.upper().replace("_",".")} \\\\\n'
-                elif r == 0:
-                    entry += f'\\multicolumn{{{msb - lsb + 1}}}{{|c|}}{{{name}}} &\n'
+from constants import *  
+from shared_utils import create_inst_dict, add_segmented_vls_insn
+from latex_utils import make_latex_table, make_priv_latex_table
+from chisel_utils import make_chisel
+from rust_utils import make_rust
+from sverilog_utils import make_sverilog
+from c_utils import make_c
+from go_utils import make_go
+
+LOG_FORMAT = '%(levelname)s:: %(message)s'
+LOG_LEVEL = logging.INFO
+
+pretty_printer = pprint.PrettyPrinter(indent=2)
+logging.basicConfig(level=LOG_LEVEL, format=LOG_FORMAT)
+
+def remove_non_extensions(args):
+    """
+    Removes non-extension flags from the command-line arguments.
+    """
+    extensions = args[1:]
+    flags = ['-c', '-latex', '-chisel', '-sverilog', '-rust', '-go', '-spinalhdl']
+    return [ext for ext in extensions if ext not in flags]
+
+def process_instruction_dict(extensions, include_pseudo):
+    """
+    Processes the instruction dictionary by creating and adding segmented instructions.
+    """
+    instr_dict = create_inst_dict(extensions, include_pseudo)
+    instr_dict = add_segmented_vls_insn(instr_dict)
+    return collections.OrderedDict(sorted(instr_dict.items()))
+
+def write_yaml(instr_dict, filename='instr_dict.yaml'):
+    """
+    Writes the instruction dictionary to a YAML file.
+    """
+    with open(filename, 'w') as outfile:
+        yaml.dump(instr_dict, outfile, default_flow_style=False)
+
+def generate_outputs(instr_dict, extensions):
+    """
+    Generates output files based on selected extensions and flags.
+    """
+    # Dictionary to map extensions to their respective functions and logging messages
+    extension_map = {
+        '-c': {
+            'function': lambda: make_c(collections.OrderedDict(sorted(create_inst_dict(extensions, False, include_pseudo_ops=emitted_pseudo_ops).items()))),
+            'message': 'encoding.out.h generated successfully'
+        },
+        '-chisel': {
+            'function': lambda: make_chisel(instr_dict),
+            'message': 'inst.chisel generated successfully'
+        },
+        '-spinalhdl': {
+            'function': lambda: make_chisel(instr_dict, spinal_hdl=True),
+            'message': 'inst.spinalhdl generated successfully'
+        },
+        '-sverilog': {
+            'function': lambda: make_sverilog(instr_dict),
+            'message': 'inst.sverilog generated successfully'
+        },
+        '-rust': {
+            'function': lambda: make_rust(instr_dict),
+            'message': 'inst.rs generated successfully'
+        },
+        '-go': {
+            'function': lambda: make_go(instr_dict),
+            'message': 'inst.go generated successfully'
+        },
+        '-latex': {
+            'function': lambda: (make_latex_table(), make_priv_latex_table()),
+            'message': [
+                'instr-table.tex generated successfully',
+                'priv-instr-table.tex generated successfully'
+            ]
+        }
+    }
+
+    for ext, actions in extension_map.items():
+        if ext in extensions:
+            try:
+                actions['function']()                
+                if isinstance(actions['message'], list):
+                    for msg in actions['message']:
+                        logging.info(msg)
                 else:
-                    entry += f'\\multicolumn{{{msb - lsb + 1}}}{{c|}}{{{name}}} &\n'
-            entry += f'\\cline{{2-{ilen+1}}}\n&\n\n'
-            instr_entries += entry
-
-        # once an entry of the dataset is completed we create the whole table
-        # with the title of that dataset as sub-heading (sort-of)
-        if title != '':
-            content += f'''
-
-\\multicolumn{{{ilen}}}{{c}}{{}} & \\\\
-\\multicolumn{{{ilen}}}{{c}}{{\\bf {title} }} & \\\\
-\\cline{{2-{ilen+1}}}
-
-            &
-{instr_entries}
-'''
-        else:
-            content += f'''
-{instr_entries}
-'''
-
-
-    header = f'''
-\\newpage
-
-\\begin{{table}}[p]
-\\begin{{small}}
-\\begin{{center}}
-    \\begin{{tabular}} {{{column_size}l}}
-    {" ".join(['&']*ilen)} \\\\
+                    logging.info(actions['message'])
 
-            &
-{type_entries}
-'''
-    endtable=f'''
+            except Exception as e:
+                logging.error(f"Error generating output for {ext}: {e}")
 
-\\end{{tabular}}
-\\end{{center}}
-\\end{{small}}
-{caption}
-\\end{{table}}
-'''
-    # dump the contents and return
-    latex_file.write(header+content+endtable)
-
-def instr_dict_2_extensions(instr_dict):
-    extensions = []
-    for item in instr_dict.values():
-        if item['extension'][0] not in extensions:
-            extensions.append(item['extension'][0])
-    return extensions
-
-def make_chisel(instr_dict, spinal_hdl=False):
-
-    chisel_names=''
-    cause_names_str=''
-    csr_names_str = ''
-    for i in instr_dict:
-        if spinal_hdl:
-            chisel_names += f'  def {i.upper().replace(".","_"):<18s} = M"b{instr_dict[i]["encoding"].replace("-","-")}"\n'
-        # else:
-        #     chisel_names += f'  def {i.upper().replace(".","_"):<18s} = BitPat("b{instr_dict[i]["encoding"].replace("-","?")}")\n'
-    if not spinal_hdl:
-        extensions = instr_dict_2_extensions(instr_dict)
-        for e in extensions:
-            e_instrs = filter(lambda i: instr_dict[i]['extension'][0] == e, instr_dict)
-            if "rv64_" in e:
-                e_format = e.replace("rv64_", "").upper() + "64"
-            elif "rv32_" in e:
-                e_format = e.replace("rv32_", "").upper() + "32"
-            elif "rv_" in e:
-                e_format = e.replace("rv_", "").upper()
-            else:
-                e_format = e.upper
-            chisel_names += f'  val {e_format+"Type"} = Map(\n'
-            for instr in e_instrs:
-                tmp_instr_name = '"'+instr.upper().replace(".","_")+'"'
-                chisel_names += f'   {tmp_instr_name:<18s} -> BitPat("b{instr_dict[instr]["encoding"].replace("-","?")}"),\n'
-            chisel_names += f'  )\n'
-
-    for num, name in causes:
-        cause_names_str += f'  val {name.lower().replace(" ","_")} = {hex(num)}\n'
-    cause_names_str += '''  val all = {
-    val res = collection.mutable.ArrayBuffer[Int]()
-'''
-    for num, name in causes:
-        cause_names_str += f'    res += {name.lower().replace(" ","_")}\n'
-    cause_names_str += '''    res.toArray
-  }'''
-
-    for num, name in csrs+csrs32:
-        csr_names_str += f'  val {name} = {hex(num)}\n'
-    csr_names_str += '''  val all = {
-    val res = collection.mutable.ArrayBuffer[Int]()
-'''
-    for num, name in csrs:
-        csr_names_str += f'''    res += {name}\n'''
-    csr_names_str += '''    res.toArray
-  }
-  val all32 = {
-    val res = collection.mutable.ArrayBuffer(all:_*)
-'''
-    for num, name in csrs32:
-        csr_names_str += f'''    res += {name}\n'''
-    csr_names_str += '''    res.toArray
-  }'''
-
-    if spinal_hdl:
-        chisel_file = open('inst.spinalhdl','w')
-    else:
-        chisel_file = open('inst.chisel','w')
-    chisel_file.write(f'''
-/* Automatically generated by parse_opcodes */
-object Instructions {{
-{chisel_names}
-}}
-object Causes {{
-{cause_names_str}
-}}
-object CSRs {{
-{csr_names_str}
-}}
-''')
-    chisel_file.close()
-
-def make_rust(instr_dict):
-    mask_match_str= ''
-    for i in instr_dict:
-        mask_match_str += f'const MATCH_{i.upper().replace(".","_")}: u32 = {(instr_dict[i]["match"])};\n'
-        mask_match_str += f'const MASK_{i.upper().replace(".","_")}: u32 = {(instr_dict[i]["mask"])};\n'
-    for num, name in csrs+csrs32:
-        mask_match_str += f'const CSR_{name.upper()}: u16 = {hex(num)};\n'
-    for num, name in causes:
-        mask_match_str += f'const CAUSE_{name.upper().replace(" ","_")}: u8 = {hex(num)};\n'
-    rust_file = open('inst.rs','w')
-    rust_file.write(f'''
-/* Automatically generated by parse_opcodes */
-{mask_match_str}
-''')
-    rust_file.close()
-
-def make_sverilog(instr_dict):
-    names_str = ''
-    for i in instr_dict:
-        names_str += f"  localparam [31:0] {i.upper().replace('.','_'):<18s} = 32'b{instr_dict[i]['encoding'].replace('-','?')};\n"
-    names_str += '  /* CSR Addresses */\n'
-    for num, name in csrs+csrs32:
-        names_str += f"  localparam logic [11:0] CSR_{name.upper()} = 12'h{hex(num)[2:]};\n"
-
-    sverilog_file = open('inst.sverilog','w')
-    sverilog_file.write(f'''
-/* Automatically generated by parse_opcodes */
-package riscv_instr;
-{names_str}
-endpackage
-''')
-    sverilog_file.close()
-def make_c(instr_dict):
-    mask_match_str = ''
-    declare_insn_str = ''
-    for i in instr_dict:
-        mask_match_str += f'#define MATCH_{i.upper().replace(".","_")} {instr_dict[i]["match"]}\n'
-        mask_match_str += f'#define MASK_{i.upper().replace(".","_")} {instr_dict[i]["mask"]}\n'
-        declare_insn_str += f'DECLARE_INSN({i.replace(".","_")}, MATCH_{i.upper().replace(".","_")}, MASK_{i.upper().replace(".","_")})\n'
-
-    csr_names_str = ''
-    declare_csr_str = ''
-    for num, name in csrs+csrs32:
-        csr_names_str += f'#define CSR_{name.upper()} {hex(num)}\n'
-        declare_csr_str += f'DECLARE_CSR({name}, CSR_{name.upper()})\n'
-
-    causes_str= ''
-    declare_cause_str = ''
-    for num, name in causes:
-        causes_str += f"#define CAUSE_{name.upper().replace(' ', '_')} {hex(num)}\n"
-        declare_cause_str += f"DECLARE_CAUSE(\"{name}\", CAUSE_{name.upper().replace(' ','_')})\n"
-
-    arg_str = ''
-    for name, rng in arg_lut.items():
-        begin = rng[1]
-        end   = rng[0]
-        mask = ((1 << (end - begin + 1)) - 1) << begin
-        arg_str += f"#define INSN_FIELD_{name.upper().replace(' ', '_')} {hex(mask)}\n"
-
-    with open(f'{os.path.dirname(__file__)}/encoding.h', 'r') as file:
-        enc_header = file.read()
-
-    commit = os.popen('git log -1 --format="format:%h"').read()
-    enc_file = open('encoding.out.h','w')
-    enc_file.write(f'''/* SPDX-License-Identifier: BSD-3-Clause */
-
-/* Copyright (c) 2023 RISC-V International */
-
-/*
- * This file is auto-generated by running 'make' in
- * https://github.com/riscv/riscv-opcodes ({commit})
- */
-
-{enc_header}
-/* Automatically generated by parse_opcodes. */
-#ifndef RISCV_ENCODING_H
-#define RISCV_ENCODING_H
-{mask_match_str}
-{csr_names_str}
-{causes_str}
-{arg_str}#endif
-#ifdef DECLARE_INSN
-{declare_insn_str}#endif
-#ifdef DECLARE_CSR
-{declare_csr_str}#endif
-#ifdef DECLARE_CAUSE
-{declare_cause_str}#endif
-''')
-    enc_file.close()
-
-def make_go(instr_dict):
-
-    args = " ".join(sys.argv)
-    prelude = f'''// Code generated by {args}; DO NOT EDIT.'''
-
-    prelude += '''
-package riscv
-
-import "cmd/internal/obj"
-
-type inst struct {
-	opcode uint32
-	funct3 uint32
-	rs1    uint32
-	rs2    uint32
-	csr    int64
-	funct7 uint32
-}
-
-func encode(a obj.As) *inst {
-	switch a {
-'''
-
-    endoffile = '''  }
-	return nil
-}
-'''
-
-    instr_str = ''
-    for i in instr_dict:
-        enc_match = int(instr_dict[i]['match'],0)
-        opcode = (enc_match >> 0) & ((1<<7)-1)
-        funct3 = (enc_match >> 12) & ((1<<3)-1)
-        rs1 = (enc_match >> 15) & ((1<<5)-1)
-        rs2 = (enc_match >> 20) & ((1<<5)-1)
-        csr = (enc_match >> 20) & ((1<<12)-1)
-        funct7 = (enc_match >> 25) & ((1<<7)-1)
-        instr_str += f'''  case A{i.upper().replace("_","")}:
-    return &inst{{ {hex(opcode)}, {hex(funct3)}, {hex(rs1)}, {hex(rs2)}, {signed(csr,12)}, {hex(funct7)} }}
-'''
-        
-    with open('inst.go','w') as file:
-        file.write(prelude)
-        file.write(instr_str)
-        file.write(endoffile)
-
-    try:
-        import subprocess
-        subprocess.run(["go", "fmt", "inst.go"])
-    except:
-        pass
-
-def signed(value, width):
-  if 0 <= value < (1<<(width-1)):
-    return value
-  else:
-    return value - (1<<width)
-
-
-if __name__ == "__main__":
+def main():
+    """
+    Main function for processing and generation of files based on command-line arguments.
+    """
     print(f'Running with args : {sys.argv}')
-
-    extensions = sys.argv[1:]
-    for i in ['-c','-latex','-chisel','-sverilog','-rust', '-go', '-spinalhdl']:
-        if i in extensions:
-            extensions.remove(i)
+    extensions = remove_non_extensions(sys.argv)
     print(f'Extensions selected : {extensions}')
 
-    include_pseudo = False
-    if "-go" in sys.argv[1:]:
-        include_pseudo = True
-
-    instr_dict = create_inst_dict(extensions, include_pseudo)
-
-    with open('instr_dict.yaml', 'w') as outfile:
-        yaml.dump(add_segmented_vls_insn(instr_dict), outfile, default_flow_style=False)
-    instr_dict = collections.OrderedDict(sorted(instr_dict.items()))
-
-    if '-c' in sys.argv[1:]:
-        instr_dict_c = create_inst_dict(extensions, False, 
-                                        include_pseudo_ops=emitted_pseudo_ops)
-        instr_dict_c = collections.OrderedDict(sorted(instr_dict_c.items()))
-        make_c(instr_dict_c)
-        logging.info('encoding.out.h generated successfully')
+    include_pseudo = '-go' in sys.argv[1:]
+    instr_dict = process_instruction_dict(extensions, include_pseudo)
 
-    if '-chisel' in sys.argv[1:]:
-        make_chisel(instr_dict)
-        logging.info('inst.chisel generated successfully')
+    write_yaml(instr_dict)
+    generate_outputs(instr_dict, sys.argv[1:])
 
-    if '-spinalhdl' in sys.argv[1:]:
-        make_chisel(instr_dict, True)
-        logging.info('inst.spinalhdl generated successfully')
-
-    if '-sverilog' in sys.argv[1:]:
-        make_sverilog(instr_dict)
-        logging.info('inst.sverilog generated successfully')
-
-    if '-rust' in sys.argv[1:]:
-        make_rust(instr_dict)
-        logging.info('inst.rs generated successfully')
-
-    if '-go' in sys.argv[1:]:
-        make_go(instr_dict)
-        logging.info('inst.go generated successfully')
-
-    if '-latex' in sys.argv[1:]:
-        make_latex_table()
-        logging.info('instr-table.tex generated successfully')
-        make_priv_latex_table()
-        logging.info('priv-instr-table.tex generated successfully')
+if __name__ == "__main__":
+    main()
diff --git a/rust_utils.py b/rust_utils.py
new file mode 100644
index 00000000..6f540a25
--- /dev/null
+++ b/rust_utils.py
@@ -0,0 +1,31 @@
+from constants import *
+import copy
+import re
+import glob
+import os
+import pprint
+import logging
+import collections
+import yaml
+import sys
+# from shared_utils import overlaps, overlap_allowed, extension_overlap_allowed, instruction_overlap_allowed, process_enc_line, same_base_isa, add_segmented_vls_insn, expand_nf_field
+from shared_utils import *
+
+pp = pprint.PrettyPrinter(indent=2)
+logging.basicConfig(level=logging.INFO, format='%(levelname)s:: %(message)s')
+
+def make_rust(instr_dict):
+    mask_match_str= ''
+    for i in instr_dict:
+        mask_match_str += f'const MATCH_{i.upper().replace(".","_")}: u32 = {(instr_dict[i]["match"])};\n'
+        mask_match_str += f'const MASK_{i.upper().replace(".","_")}: u32 = {(instr_dict[i]["mask"])};\n'
+    for num, name in csrs+csrs32:
+        mask_match_str += f'const CSR_{name.upper()}: u16 = {hex(num)};\n'
+    for num, name in causes:
+        mask_match_str += f'const CAUSE_{name.upper().replace(" ","_")}: u8 = {hex(num)};\n'
+    rust_file = open('inst.rs','w')
+    rust_file.write(f'''
+/* Automatically generated by parse_opcodes */
+{mask_match_str}
+''')
+    rust_file.close()
diff --git a/shared_utils.py b/shared_utils.py
new file mode 100644
index 00000000..0fc6db91
--- /dev/null
+++ b/shared_utils.py
@@ -0,0 +1,547 @@
+#!/usr/bin/env python3
+import copy
+import re
+import glob
+import os
+import pprint
+import logging
+
+from constants import *
+
+LOG_FORMAT = '%(levelname)s:: %(message)s'
+LOG_LEVEL = logging.INFO
+
+pretty_printer = pprint.PrettyPrinter(indent=2)
+logging.basicConfig(level=LOG_LEVEL, format=LOG_FORMAT)
+
+
+def process_enc_line(line, ext):
+    '''
+    This function processes each line of the encoding files (rv*). As part of
+    the processing, the function ensures that the encoding is legal through the
+    following checks::
+
+        - there is no over specification (same bits assigned different values)
+        - there is no under specification (some bits not assigned values)
+        - bit ranges are in the format hi..lo=val where hi > lo
+        - value assigned is representable in the bit range
+        - also checks that the mapping of arguments of an instruction exists in
+          arg_lut.
+
+    If the above checks pass, then the function returns a tuple of the name and
+    a dictionary containing basic information of the instruction which includes:
+        - variables: list of arguments used by the instruction whose mapping
+          exists in the arg_lut dictionary
+        - encoding: this contains the 32-bit encoding of the instruction where
+          '-' is used to represent position of arguments and 1/0 is used to
+          reprsent the static encoding of the bits
+        - extension: this field contains the rv* filename from which this
+          instruction was included
+        - match: hex value representing the bits that need to match to detect
+          this instruction
+        - mask: hex value representin the bits that need to be masked to extract
+          the value required for matching.
+    '''
+    encoding = initialize_encoding()
+    name, remaining = parse_instruction_name(line)
+
+    # Fixed ranges of the form hi..lo=val
+    process_fixed_ranges(remaining, encoding, line)
+
+    # Single fixed values of the form <lsb>=<val>
+    remaining = process_single_fixed(remaining, encoding, line)
+
+    # Create match and mask strings
+    match, mask = create_match_and_mask(encoding)
+
+    # Process instruction arguments
+    args = process_arguments(remaining, encoding, name)
+
+    # Create and return the final instruction dictionary
+    instruction_dict = create_instruction_dict(encoding, args, ext, match, mask)
+
+    return name, instruction_dict
+
+
+def initialize_encoding():
+    """Initialize a 32-bit encoding with '-' representing 'don't care'."""
+    return ['-'] * 32
+
+
+def parse_instruction_name(line):
+    """Extract the instruction name and remaining part of the line."""
+    name, remaining = line.split(' ', 1)
+    name = name.replace('.', '_').lstrip()
+    return name, remaining
+
+
+def process_fixed_ranges(remaining, encoding, line):
+    """Process bit ranges of the form hi..lo=val, checking for errors and updating encoding."""
+    for s2, s1, entry in fixed_ranges.findall(remaining):
+        msb, lsb = int(s2), int(s1)
+        validate_bit_range(msb, lsb, line)
+        validate_entry_value(msb, lsb, entry, line)
+        update_encoding(msb, lsb, entry, encoding, line)
+
+
+def validate_bit_range(msb, lsb, line):
+    """Ensure that msb > lsb and raise an error if not."""
+    if msb < lsb:
+        log_and_exit(f"{get_instruction_name(line)} has msb < lsb in its encoding")
+
+
+def validate_entry_value(msb, lsb, entry, line):
+    """Ensure that the value assigned to a bit range is legal for its width."""
+    entry_value = int(entry, 0)
+    if entry_value >= (1 << (msb - lsb + 1)):
+        log_and_exit(f"{get_instruction_name(line)} has an illegal value for the bit width {msb - lsb}")
+
+
+def update_encoding(msb, lsb, entry, encoding, line):
+    """Update the encoding array for a given bit range."""
+    entry_value = int(entry, 0)
+    for ind in range(lsb, msb + 1):
+        if encoding[31 - ind] != '-':
+            log_and_exit(f"{get_instruction_name(line)} has overlapping bits in its opcodes")
+        encoding[31 - ind] = str((entry_value >> (ind - lsb)) & 1)
+
+
+def process_single_fixed(remaining, encoding, line):
+    """Process single fixed values of the form <lsb>=<val>."""
+    for lsb, value, _ in single_fixed.findall(remaining):
+        lsb = int(lsb, 0)
+        value = int(value, 0)
+        if encoding[31 - lsb] != '-':
+            log_and_exit(f"{get_instruction_name(line)} has overlapping bits in its opcodes")
+        encoding[31 - lsb] = str(value)
+    return fixed_ranges.sub(' ', remaining)
+
+
+def create_match_and_mask(encoding):
+    """Generate match and mask strings from the encoding array."""
+    match = ''.join(encoding).replace('-', '0')
+    mask = ''.join(encoding).replace('0', '1').replace('-', '0')
+    return match, mask
+
+
+def process_arguments(remaining, encoding, name):
+    """Process instruction arguments and update the encoding with argument positions."""
+    args = single_fixed.sub(' ', remaining).split()
+    encoding_args = encoding.copy()
+    for arg in args:
+        if arg not in arg_lut:
+            handle_missing_arg(arg, name)
+        msb, lsb = arg_lut[arg]
+        update_arg_encoding(msb, lsb, arg, encoding_args, name)
+    return args, encoding_args
+
+
+def handle_missing_arg(arg, name):
+    """Handle missing argument mapping in arg_lut."""
+    if '=' in arg and (existing_arg := arg.split('=')[0]) in arg_lut:
+        arg_lut[arg] = arg_lut[existing_arg]
+    else:
+        log_and_exit(f"Variable {arg} in instruction {name} not mapped in arg_lut")
+
+
+def update_arg_encoding(msb, lsb, arg, encoding_args, name):
+    """Update the encoding array with the argument positions."""
+    for ind in range(lsb, msb + 1):
+        if encoding_args[31 - ind] != '-':
+            log_and_exit(f"Variable {arg} overlaps in bit {ind} in instruction {name}")
+        encoding_args[31 - ind] = arg
+
+
+def create_instruction_dict(encoding, args, ext, match, mask):
+    """Create the final dictionary for the instruction."""
+    return {
+        'encoding': ''.join(encoding),
+        'variable_fields': args,
+        'extension': [os.path.basename(ext)],
+        'match': hex(int(match, 2)),
+        'mask': hex(int(mask, 2)),
+    }
+
+
+def log_and_exit(message):
+    """Log an error message and exit the program."""
+    logging.error(message)
+    raise SystemExit(1)
+
+
+def get_instruction_name(line):
+    """Helper to extract the instruction name from a line."""
+    return line.split(' ')[0]
+
+def overlaps(x, y):
+    """
+    Check if two bit strings overlap without conflicts.
+    
+    Args:
+        x (str): First bit string.
+        y (str): Second bit string.
+    
+    Returns:
+        bool: True if the bit strings overlap without conflicts, False otherwise.
+        
+    In the context of RISC-V opcodes, this function ensures that the bit ranges 
+    defined by two different bit strings do not conflict.
+    """
+    
+    # Minimum length of the two strings
+    min_len = min(len(x), len(y))
+    
+    for char_x, char_y in zip(x[:min_len], y[:min_len]):
+        if char_x != '-' and char_y != '-' and char_x != char_y:
+            return False
+    
+    return True
+
+
+def overlap_allowed(a, x, y):
+    """
+    Check if there is an overlap between keys and values in a dictionary.
+    
+    Args:
+        a (dict): The dictionary where keys are mapped to sets or lists of keys.
+        x (str): The first key to check.
+        y (str): The second key to check.
+    
+    Returns:
+        bool: True if both (x, y) or (y, x) are present in the dictionary 
+              as described, False otherwise.
+        
+    This function determines if `x` is a key in the dictionary `a` and 
+    its corresponding value contains `y`, or if `y` is a key and its 
+    corresponding value contains `x`.
+    """
+    
+    return x in a and y in a[x] or \
+           y in a and x in a[y]
+
+
+# Checks if overlap between two extensions is allowed
+def extension_overlap_allowed(x, y):
+    return overlap_allowed(overlapping_extensions, x, y)
+
+
+# Checks if overlap between two instructions is allowed
+def instruction_overlap_allowed(x, y):
+    return overlap_allowed(overlapping_instructions, x, y)
+
+
+# Checks if ext_name shares the same base ISA with any in ext_name_list
+def same_base_isa(ext_name, ext_name_list):
+    type1 = ext_name.split("_")[0]
+    for ext_name1 in ext_name_list:
+        type2 = ext_name1.split("_")[0]
+        if type1 == type2 or \
+           (type2 == "rv" and type1 in ["rv32", "rv64"]) or \
+           (type1 == "rv" and type2 in ["rv32", "rv64"]):
+            return True
+    return False
+
+
+# Expands instructions with "nf" field in variable_fields, otherwise returns unchanged
+def add_segmented_vls_insn(instr_dict):
+    updated_dict = {}
+    for k, v in instr_dict.items():
+        if "nf" in v['variable_fields']:
+            updated_dict.update(expand_nf_field(k, v))
+        else:
+            updated_dict[k] = v
+    return updated_dict
+
+
+# Expands nf field in instruction name and updates instruction details
+def expand_nf_field(name, single_dict):
+    if "nf" not in single_dict['variable_fields']:
+        logging.error(f"Cannot expand nf field for instruction {name}")
+        raise SystemExit(1)
+
+    single_dict['variable_fields'].remove("nf")  # Remove "nf" from variable fields
+    single_dict['mask'] = hex(int(single_dict['mask'], 16) | (0b111 << 29))  # Update mask
+
+    name_expand_index = name.find('e')
+    expanded_instructions = []
+    for nf in range(8):  # Expand nf for values 0 to 7
+        new_single_dict = copy.deepcopy(single_dict)
+        new_single_dict['match'] = hex(int(single_dict['match'], 16) | (nf << 29))
+        new_single_dict['encoding'] = format(nf, '03b') + single_dict['encoding'][3:]
+        new_name = name if nf == 0 else f"{name[:name_expand_index]}seg{nf+1}{name[name_expand_index:]}"
+        expanded_instructions.append((new_name, new_single_dict))
+    return expanded_instructions
+
+
+# Extracts the extensions used in an instruction dictionary
+def instr_dict_2_extensions(instr_dict):
+    return list({item['extension'][0] for item in instr_dict.values()})
+
+
+# Returns signed interpretation of a value within a given width
+def signed(value, width):
+    return value if 0 <= value < (1 << (width - 1)) else value - (1 << width)
+
+
+def create_inst_dict(file_filter, include_pseudo=False, include_pseudo_ops=[]):
+    '''
+    This function return a dictionary containing all instructions associated
+    with an extension defined by the file_filter input. The file_filter input
+    needs to be rv* file name with out the 'rv' prefix i.e. '_i', '32_i', etc.
+
+    Each node of the dictionary will correspond to an instruction which again is
+    a dictionary. The dictionary contents of each instruction includes:
+        - variables: list of arguments used by the instruction whose mapping
+          exists in the arg_lut dictionary
+        - encoding: this contains the 32-bit encoding of the instruction where
+          '-' is used to represent position of arguments and 1/0 is used to
+          reprsent the static encoding of the bits
+        - extension: this field contains the rv* filename from which this
+          instruction was included
+        - match: hex value representing the bits that need to match to detect
+          this instruction
+        - mask: hex value representin the bits that need to be masked to extract
+          the value required for matching.
+
+    In order to build this dictionary, the function does 2 passes over the same
+    rv<file_filter> file. The first pass is to extract all standard
+    instructions. In this pass, all pseudo ops and imported instructions are
+    skipped. For each selected line of the file, we call process_enc_line
+    function to create the above mentioned dictionary contents of the
+    instruction. Checks are performed in this function to ensure that the same
+    instruction is not added twice to the overall dictionary.
+
+    In the second pass, this function parses only pseudo_ops. For each pseudo_op
+    this function checks if the dependent extension and instruction, both, exist
+    before parsing it. The pseudo op is only added to the overall dictionary if
+    the dependent instruction is not present in the dictionary, else it is
+    skipped.
+
+
+    '''
+    opcodes_dir = os.path.dirname(os.path.realpath(__file__))
+    instr_dict = {}
+
+    # file_names contains all files to be parsed in the riscv-opcodes directory
+    file_names = []
+    for fil in file_filter:
+        file_names += glob.glob(f'{opcodes_dir}/{fil}')
+    file_names.sort(reverse=True)
+    # first pass if for standard/regular instructions
+    logging.debug('Collecting standard instructions first')
+    for f in file_names:
+        logging.debug(f'Parsing File: {f} for standard instructions')
+        with open(f) as fp:
+            lines = (line.rstrip()
+                     for line in fp)  # All lines including the blank ones
+            lines = list(line for line in lines if line)  # Non-blank lines
+            lines = list(
+                line for line in lines
+                if not line.startswith("#"))  # remove comment lines
+
+        # go through each line of the file
+        for line in lines:
+            # if the an instruction needs to be imported then go to the
+            # respective file and pick the line that has the instruction.
+            # The variable 'line' will now point to the new line from the
+            # imported file
+
+            # ignore all lines starting with $import and $pseudo
+            if '$import' in line or '$pseudo' in line:
+                continue
+            logging.debug(f'     Processing line: {line}')
+
+            # call process_enc_line to get the data about the current
+            # instruction
+            (name, single_dict) = process_enc_line(line, f)
+            ext_name = os.path.basename(f)
+
+            # if an instruction has already been added to the filtered
+            # instruction dictionary throw an error saying the given
+            # instruction is already imported and raise SystemExit
+            if name in instr_dict:
+                var = instr_dict[name]["extension"]
+                if same_base_isa(ext_name, var):
+                    # disable same names on the same base ISA
+                    err_msg = f'instruction : {name} from '
+                    err_msg += f'{ext_name} is already '
+                    err_msg += f'added from {var} in same base ISA'
+                    logging.error(err_msg)
+                    raise SystemExit(1)
+                elif instr_dict[name]['encoding'] != single_dict['encoding']:
+                    # disable same names with different encodings on different base ISAs
+                    err_msg = f'instruction : {name} from '
+                    err_msg += f'{ext_name} is already '
+                    err_msg += f'added from {var} but each have different encodings in different base ISAs'
+                    logging.error(err_msg)
+                    raise SystemExit(1)
+                instr_dict[name]['extension'].extend(single_dict['extension'])
+            else:
+              for key in instr_dict:
+                  item = instr_dict[key]
+                  if overlaps(item['encoding'], single_dict['encoding']) and \
+                    not extension_overlap_allowed(ext_name, item['extension'][0]) and \
+                    not instruction_overlap_allowed(name, key) and \
+                    same_base_isa(ext_name, item['extension']):
+                      # disable different names with overlapping encodings on the same base ISA
+                      err_msg = f'instruction : {name} in extension '
+                      err_msg += f'{ext_name} overlaps instruction {key} '
+                      err_msg += f'in extension {item["extension"]}'
+                      logging.error(err_msg)
+                      raise SystemExit(1)
+
+            if name not in instr_dict:
+                # update the final dict with the instruction
+                instr_dict[name] = single_dict
+
+    # second pass if for pseudo instructions
+    logging.debug('Collecting pseudo instructions now')
+    for f in file_names:
+        logging.debug(f'Parsing File: {f} for pseudo_ops')
+        with open(f) as fp:
+            lines = (line.rstrip()
+                     for line in fp)  # All lines including the blank ones
+            lines = list(line for line in lines if line)  # Non-blank lines
+            lines = list(
+                line for line in lines
+                if not line.startswith("#"))  # remove comment lines
+
+        # go through each line of the file
+        for line in lines:
+
+            # ignore all lines not starting with $pseudo
+            if '$pseudo' not in line:
+                continue
+            logging.debug(f'     Processing line: {line}')
+
+            # use the regex pseudo_regex from constants.py to find the dependent
+            # extension, dependent instruction, the pseudo_op in question and
+            # its encoding
+            (ext, orig_inst, pseudo_inst, line) = pseudo_regex.findall(line)[0]
+            ext_file = f'{opcodes_dir}/{ext}'
+
+            # check if the file of the dependent extension exist. Throw error if
+            # it doesn't
+            if not os.path.exists(ext_file):
+                ext1_file = f'{opcodes_dir}/unratified/{ext}'
+                if not os.path.exists(ext1_file):
+                    logging.error(f'Pseudo op {pseudo_inst} in {f} depends on {ext} which is not available')
+                    raise SystemExit(1)
+                else:
+                    ext_file = ext1_file
+
+            # check if the dependent instruction exist in the dependent
+            # extension. Else throw error.
+            found = False
+            for oline in open(ext_file):
+                if not re.findall(f'^\\s*{orig_inst}\\s+',oline):
+                    continue
+                else:
+                    found = True
+                    break
+            if not found:
+                logging.error(f'Orig instruction {orig_inst} not found in {ext}. Required by pseudo_op {pseudo_inst} present in {f}')
+                raise SystemExit(1)
+
+
+            (name, single_dict) = process_enc_line(pseudo_inst + ' ' + line, f)
+            # add the pseudo_op to the dictionary only if the original
+            # instruction is not already in the dictionary.
+            if orig_inst.replace('.','_') not in instr_dict \
+                    or include_pseudo \
+                    or name in include_pseudo_ops:
+
+                # update the final dict with the instruction
+                if name not in instr_dict:
+                    instr_dict[name] = single_dict
+                    logging.debug(f'        including pseudo_ops:{name}')
+                else:
+                    if(single_dict['match'] != instr_dict[name]['match']):
+                        instr_dict[name + '_pseudo'] = single_dict
+
+                    # if a pseudo instruction has already been added to the filtered
+                    # instruction dictionary but the extension is not in the current
+                    # list, add it
+                    else:
+                        ext_name = single_dict['extension']
+
+                    if (ext_name not in instr_dict[name]['extension']) & (name + '_pseudo' not in instr_dict):
+                        instr_dict[name]['extension'].extend(ext_name)
+            else:
+                logging.debug(f'        Skipping pseudo_op {pseudo_inst} since original instruction {orig_inst} already selected in list')
+
+    # third pass if for imported instructions
+    logging.debug('Collecting imported instructions')
+    for f in file_names:
+        logging.debug(f'Parsing File: {f} for imported ops')
+        with open(f) as fp:
+            lines = (line.rstrip()
+                     for line in fp)  # All lines including the blank ones
+            lines = list(line for line in lines if line)  # Non-blank lines
+            lines = list(
+                line for line in lines
+                if not line.startswith("#"))  # remove comment lines
+
+        # go through each line of the file
+        for line in lines:
+            # if the an instruction needs to be imported then go to the
+            # respective file and pick the line that has the instruction.
+            # The variable 'line' will now point to the new line from the
+            # imported file
+
+            # ignore all lines starting with $import and $pseudo
+            if '$import' not in line :
+                continue
+            logging.debug(f'     Processing line: {line}')
+
+            (import_ext, reg_instr) = imported_regex.findall(line)[0]
+            import_ext_file = f'{opcodes_dir}/{import_ext}'
+
+            # check if the file of the dependent extension exist. Throw error if
+            # it doesn't
+            if not os.path.exists(import_ext_file):
+                ext1_file = f'{opcodes_dir}/unratified/{import_ext}'
+                if not os.path.exists(ext1_file):
+                    logging.error(f'Instruction {reg_instr} in {f} cannot be imported from {import_ext}')
+                    raise SystemExit(1)
+                else:
+                    ext_file = ext1_file
+            else:
+                ext_file = import_ext_file
+
+            # check if the dependent instruction exist in the dependent
+            # extension. Else throw error.
+            found = False
+            for oline in open(ext_file):
+                if not re.findall(f'^\\s*{reg_instr}\\s+',oline):
+                    continue
+                else:
+                    found = True
+                    break
+            if not found:
+                logging.error(f'imported instruction {reg_instr} not found in {ext_file}. Required by {line} present in {f}')
+                logging.error(f'Note: you cannot import pseudo/imported ops.')
+                raise SystemExit(1)
+
+            # call process_enc_line to get the data about the current
+            # instruction
+            (name, single_dict) = process_enc_line(oline, f)
+
+            # if an instruction has already been added to the filtered
+            # instruction dictionary throw an error saying the given
+            # instruction is already imported and raise SystemExit
+            if name in instr_dict:
+                var = instr_dict[name]["extension"]
+                if instr_dict[name]['encoding'] != single_dict['encoding']:
+                    err_msg = f'imported instruction : {name} in '
+                    err_msg += f'{os.path.basename(f)} is already '
+                    err_msg += f'added from {var} but each have different encodings for the same instruction'
+                    logging.error(err_msg)
+                    raise SystemExit(1)
+                instr_dict[name]['extension'].extend(single_dict['extension'])
+            else:
+                # update the final dict with the instruction
+                instr_dict[name] = single_dict
+    return instr_dict
+
+
diff --git a/sverilog_utils.py b/sverilog_utils.py
new file mode 100644
index 00000000..4a6ace10
--- /dev/null
+++ b/sverilog_utils.py
@@ -0,0 +1,30 @@
+import re
+import glob
+import os
+import pprint
+import logging
+import collections
+import yaml
+import sys
+# from shared_utils import overlaps, overlap_allowed, extension_overlap_allowed, instruction_overlap_allowed, process_enc_line, same_base_isa, add_segmented_vls_insn, expand_nf_field
+from shared_utils import *
+
+pp = pprint.PrettyPrinter(indent=2)
+logging.basicConfig(level=logging.INFO, format='%(levelname)s:: %(message)s')
+
+def make_sverilog(instr_dict):
+    names_str = ''
+    for i in instr_dict:
+        names_str += f"  localparam [31:0] {i.upper().replace('.','_'):<18s} = 32'b{instr_dict[i]['encoding'].replace('-','?')};\n"
+    names_str += '  /* CSR Addresses */\n'
+    for num, name in csrs+csrs32:
+        names_str += f"  localparam logic [11:0] CSR_{name.upper()} = 12'h{hex(num)[2:]};\n"
+
+    sverilog_file = open('inst.sverilog','w')
+    sverilog_file.write(f'''
+/* Automatically generated by parse_opcodes */
+package riscv_instr;
+{names_str}
+endpackage
+''')
+    sverilog_file.close()
\ No newline at end of file