us_disassemble2: invent a better fragment shader syntax

This commit is contained in:
Zack Buhman 2025-10-19 20:29:33 -05:00
parent 0879b6b8f1
commit 59b6b2a0d2
4 changed files with 365 additions and 10 deletions

View File

@ -64,7 +64,7 @@ ADDR2_REL 29 0x0 Specifies whether the loop register is added to
01 - RELATIVE: Add aL before lookup.
SRCP_OP 31:30 0x0 Specifies how the pre-subtract value (SRCP) is computed.
POSSIBLE VALUES:
00 - 1.0-2.0*A0
01 - A1-A0
02 - A1+A0
03 - 1.0-A0
00 - neg2: 1.0-2.0*A0
01 - sub: A1-A0
02 - add: A1+A0
03 - neg: 1.0-A0

View File

@ -65,7 +65,7 @@ ADDR2_REL 29 0x0 Specifies whether the loop register is added to
SRCP_OP 31:30 0x0 Specifies how the pre-subtract value (SRCP) is
computed.
POSSIBLE VALUES:
00 - 1.0-2.0*RGB0
01 - RGB1-RGB0
02 - RGB1+RGB0
03 - 1.0-RGB0
00 - neg2: 1.0-2.0*RGB0
01 - sub: RGB1-RGB0
02 - add: RGB1+RGB0
03 - neg: 1.0-RGB0

View File

@ -45,8 +45,10 @@ fc = [
]
def parse_registers():
base = path.dirname(__file__)
for register in register_names:
filename = path.join("bits", register.lower() + ".txt")
filename = path.join(base, "bits", register.lower() + ".txt")
l = list(parse_bits.parse_file_fields(filename))
yield register, OrderedDict(
(d.field_name, d) for d in parse_bits.aggregate(l)
@ -142,5 +144,4 @@ if __name__ == "__main__":
buf = f.read()
code = [parse_hex(c.strip()) for c in buf.split(',') if c.strip()]
for i in range(len(code) // 6):
disassemble(code, i * 6)

354
regs/us_disassemble2.py Normal file
View File

@ -0,0 +1,354 @@
import sys
from os import path
import parse_bits
from collections import OrderedDict
from functools import partial
from pprint import pprint
VERBOSE = False
class BaseRegister:
def get(self, code, *, code_ix, descriptor):
n = code[code_ix]
if type(descriptor.bits) is int:
return (n >> descriptor.bits) & 1
else:
high, low = descriptor.bits
assert high > low
mask_length = (high - low) + 1
mask = (1 << mask_length) - 1
return (n >> low) & mask
def get_name(self, n, *, code_ix, descriptor):
value = self.get(n, code_ix=code_ix, descriptor=descriptor)
return value, *descriptor.possible_values[value]
_descriptor_indicies = {
"US_CMN_INST": 0,
"US_ALU_RGB_ADDR": 1,
"US_ALU_ALPHA_ADDR": 2,
"US_ALU_RGB_INST": 3,
"US_ALU_ALPHA_INST": 4,
"US_ALU_RGBA_INST": 5,
"US_TEX_INST": 1,
"US_TEX_ADDR": 2,
"US_TEX_ADDR_DXDY": 3,
"US_FC_INST": 2,
"US_FC_ADDR": 3,
}
def parse_register(register_name):
base = path.dirname(__file__)
filename = path.join(base, "bits", register_name.lower() + ".txt")
l = list(parse_bits.parse_file_fields(filename))
cls = type(register_name, (BaseRegister,), {})
instance = cls()
descriptors = list(parse_bits.aggregate(l))
code_ix = _descriptor_indicies[register_name]
for descriptor in descriptors:
setattr(instance, descriptor.field_name,
partial(instance.get, code_ix=code_ix, descriptor=descriptor))
setattr(instance, f"_{descriptor.field_name}",
partial(instance.get_name, code_ix=code_ix, descriptor=descriptor))
func = getattr(instance, descriptor.field_name)
for pv_value, (pv_name, _) in descriptor.possible_values.items():
if pv_name is not None:
setattr(func, pv_name, pv_value)
assert getattr(instance, "descriptors", None) is None
instance.descriptors = descriptors
return instance
US_CMN_INST = parse_register("US_CMN_INST")
US_ALU_RGB_ADDR = parse_register("US_ALU_RGB_ADDR")
US_ALU_ALPHA_ADDR = parse_register("US_ALU_ALPHA_ADDR")
US_ALU_RGB_INST = parse_register("US_ALU_RGB_INST")
US_ALU_ALPHA_INST = parse_register("US_ALU_ALPHA_INST")
US_ALU_RGBA_INST = parse_register("US_ALU_RGBA_INST")
US_TEX_INST = parse_register("US_TEX_INST")
US_TEX_ADDR = parse_register("US_TEX_ADDR")
US_TEX_ADDR_DXDY = parse_register("US_TEX_ADDR_DXDY")
US_FC_INST = parse_register("US_FC_INST")
US_FC_ADDR = parse_register("US_FC_ADDR")
def disassemble_addr_inner(register_const, address, const, rel):
assert rel == 0
if const == register_const.TEMPORARY:
if address & (1 << 7):
value = address & 0x7f
return f"float({value})"
else:
return f"temp[{address}]"
elif const == register_const.CONSTANT:
return f"const[{address}]"
else:
assert False, const
swizzle_strs = ['r', 'g', 'b', 'a', '0', 'h', '1', '_']
sel_strs = ['0', '1', '2', 'p']
def disassemble_addr(register, code, suffix):
addr0 = register.ADDR0(code)
addr0_const = register.ADDR0_CONST(code)
addr0_rel = register.ADDR0_REL(code)
addr1 = register.ADDR1(code)
addr1_const = register.ADDR1_CONST(code)
addr1_rel = register.ADDR1_REL(code)
addr2 = register.ADDR2(code)
addr2_const = register.ADDR2_CONST(code)
addr2_rel = register.ADDR2_REL(code)
_, srcp_op, _ = register._SRCP_OP(code)
s0 = disassemble_addr_inner(register.ADDR0_CONST, addr0, addr0_const, addr0_rel)
s1 = disassemble_addr_inner(register.ADDR1_CONST, addr1, addr1_const, addr1_rel)
s2 = disassemble_addr_inner(register.ADDR2_CONST, addr2, addr2_const, addr2_rel)
sp = srcp_op.lower()
return [
f"src{sel_strs[i]}.{suffix} = {s}"
for i, s in enumerate([s0, s1, s2, sp])
]
def mod_str(s, mod):
if mod == 0: # NOP
return s
elif mod == 1: # NEG
return f"-{s}"
elif mod == 2: # ABS
return f"|{s}|"
elif mod == 3: # NAB
return f"-|{s}|"
else:
assert False, mod
def disassemble_rgb_swizzle_sel(code):
rgb_sel_a = US_ALU_RGB_INST.RGB_SEL_A(code)
red_swiz_a = US_ALU_RGB_INST.RED_SWIZ_A(code)
green_swiz_a = US_ALU_RGB_INST.GREEN_SWIZ_A(code)
blue_swiz_a = US_ALU_RGB_INST.BLUE_SWIZ_A(code)
rgb_mod_a = US_ALU_RGB_INST.RGB_MOD_A(code)
rgb_sel_b = US_ALU_RGB_INST.RGB_SEL_B(code)
red_swiz_b = US_ALU_RGB_INST.RED_SWIZ_B(code)
green_swiz_b = US_ALU_RGB_INST.GREEN_SWIZ_B(code)
blue_swiz_b = US_ALU_RGB_INST.BLUE_SWIZ_B(code)
rgb_mod_b = US_ALU_RGB_INST.RGB_MOD_B(code)
rgb_sel_c = US_ALU_RGBA_INST.RGB_SEL_C(code)
red_swiz_c = US_ALU_RGBA_INST.RED_SWIZ_C(code)
green_swiz_c = US_ALU_RGBA_INST.GREEN_SWIZ_C(code)
blue_swiz_c = US_ALU_RGBA_INST.BLUE_SWIZ_C(code)
rgb_mod_c = US_ALU_RGBA_INST.RGB_MOD_C(code)
rgb_swiz_a = ''.join(swizzle_strs[n] for n in [red_swiz_a, green_swiz_a, blue_swiz_a])
rgb_swiz_b = ''.join(swizzle_strs[n] for n in [red_swiz_b, green_swiz_b, blue_swiz_b])
rgb_swiz_c = ''.join(swizzle_strs[n] for n in [red_swiz_c, green_swiz_c, blue_swiz_c])
rgb_swiz = [rgb_swiz_a, rgb_swiz_b, rgb_swiz_c]
rgb_sels = [rgb_sel_a, rgb_sel_b, rgb_sel_c]
rgb_mods = [rgb_mod_a, rgb_mod_b, rgb_mod_c]
return [mod_str(f"src{sel_strs[sel]}.{swiz}", mod)
for swiz, sel, mod in zip(rgb_swiz, rgb_sels, rgb_mods)], rgb_sels
def disassemble_a_swizzle_sel(code):
alpha_sel_a = US_ALU_ALPHA_INST.ALPHA_SEL_A(code)
alpha_swiz_a = US_ALU_ALPHA_INST.ALPHA_SWIZ_A(code)
alpha_mod_a = US_ALU_ALPHA_INST.ALPHA_MOD_A(code)
alpha_sel_b = US_ALU_ALPHA_INST.ALPHA_SEL_B(code)
alpha_swiz_b = US_ALU_ALPHA_INST.ALPHA_SWIZ_B(code)
alpha_mod_b = US_ALU_ALPHA_INST.ALPHA_MOD_B(code)
alpha_sel_c = US_ALU_RGBA_INST.ALPHA_SEL_C(code)
alpha_swiz_c = US_ALU_RGBA_INST.ALPHA_SWIZ_C(code)
alpha_mod_c = US_ALU_RGBA_INST.ALPHA_MOD_C(code)
a_swiz = [swizzle_strs[n] for n in [alpha_swiz_a, alpha_swiz_b, alpha_swiz_c]]
a_sels = [alpha_sel_a, alpha_sel_b, alpha_sel_c]
a_mods = [alpha_mod_a, alpha_mod_b, alpha_mod_c]
return [mod_str(f"src{sel_strs[sel]}.{swiz}", mod)
for swiz, sel, mod in zip(a_swiz, a_sels, a_mods)], a_sels
def omod_str(s, mod):
if s == 0: # * 1
return s
elif s == 1: # * 1
return f"({s}) * 1"
elif s == 2: # * 2
return f"({s}) * 2"
elif s == 3: # * 4
return f"({s}) * 4"
elif s == 4: # * 8
return f"({s}) * 8"
elif s == 5: # / 2
return f"({s}) / 2"
elif s == 6: # / 4
return f"({s}) / 4"
elif s == 7: # DISABLE OMOD
return s
def disassemble_alu_dest(code):
a_addrd = US_ALU_ALPHA_INST.ALPHA_ADDRD(code)
a_addrd_rel = US_ALU_ALPHA_INST.ALPHA_ADDRD_REL(code)
assert a_addrd_rel == 0
rgb_addrd = US_ALU_RGBA_INST.RGB_ADDRD(code)
rgb_addrd_rel = US_ALU_RGBA_INST.RGB_ADDRD_REL(code)
assert rgb_addrd_rel == 0
_, rgb_wmask, _ = US_CMN_INST._RGB_WMASK(code)
_, a_wmask, _ = US_CMN_INST._ALPHA_WMASK(code)
_, rgb_omask, _ = US_CMN_INST._RGB_OMASK(code)
_, a_omask, _ = US_CMN_INST._ALPHA_OMASK(code)
a_out_str = f"out[{a_addrd}].{a_omask.lower().ljust(4)}"
a_temp_str = f"temp[{a_addrd}].{a_wmask.lower().ljust(4)}"
rgb_out_str = f"out[{rgb_addrd}].{rgb_omask.lower().ljust(4)}"
rgb_temp_str = f"temp[{rgb_addrd}].{rgb_wmask.lower().ljust(4)}"
return (a_out_str, a_temp_str), (rgb_out_str, rgb_temp_str)
def assert_zeros(code):
rgb_pred_sel = US_CMN_INST.RGB_PRED_SEL(code)
assert rgb_pred_sel == 0
rgb_pred_inv = US_CMN_INST.RGB_PRED_INV(code)
assert rgb_pred_inv == 0
write_inactive = US_CMN_INST.WRITE_INACTIVE(code)
assert write_inactive == 0
last = US_CMN_INST.LAST(code)
assert last == 0
nop = US_CMN_INST.NOP(code)
assert nop == 0
alu_wait = US_CMN_INST.ALU_WAIT(code)
assert alu_wait == 0
rgb_clamp = US_CMN_INST.RGB_CLAMP(code)
assert rgb_clamp == 0
alpha_clamp = US_CMN_INST.ALPHA_CLAMP(code)
assert alpha_clamp == 0
alu_result_sel = US_CMN_INST.ALU_RESULT_SEL(code)
assert alu_result_sel == 0
alpha_pred_inv = US_CMN_INST.ALPHA_PRED_INV(code)
assert alpha_pred_inv == 0
alu_result_op = US_CMN_INST.ALU_RESULT_OP(code)
assert alu_result_op == 0
alpha_pred_sel = US_CMN_INST.ALPHA_PRED_SEL(code)
assert alpha_pred_sel == 0
stat_we = US_CMN_INST.STAT_WE(code)
assert stat_we == 0
rgb_omod = US_ALU_RGB_INST.OMOD(code)
rgb_target = US_ALU_RGB_INST.TARGET(code)
alu_wmask = US_ALU_RGB_INST.ALU_WMASK(code)
assert rgb_omod in {0, 7}
assert rgb_target == 0
assert alu_wmask == 0
a_omod = US_ALU_ALPHA_INST.OMOD(code)
a_target = US_ALU_ALPHA_INST.TARGET(code)
w_omask = US_ALU_ALPHA_INST.W_OMASK(code)
assert a_omod in {0, 7}
assert a_target == 0
assert w_omask == 0
_rgb_op_operands = {
"OP_MAD": 3,
"OP_DP3": 2,
"OP_DP4": 2,
"OP_D2A": 3,
"OP_MIN": 2,
"OP_MAX": 2,
"OP_CND": 3,
"OP_CMP": 3,
"OP_FRC": 1,
"OP_SOP": 0,
"OP_MDH": 3,
"OP_MDV": 3,
}
_a_op_operands = {
"OP_MAD": 3,
"OP_DP": 0,
"OP_MIN": 2,
"OP_MAX": 2,
"OP_CND": 3,
"OP_CMP": 3,
"OP_FRC": 1,
"OP_EX2": 1,
"OP_RCP": 1,
"OP_RSQ": 1,
"OP_SIN": 1,
"OP_COS": 1,
"OP_MDH": 3,
"OP_MDV": 3
}
def disassemble_alu(code, is_output):
assert_zeros(code)
a_addr_strs = disassemble_addr(US_ALU_ALPHA_ADDR, code, "a")
rgb_addr_strs = disassemble_addr(US_ALU_RGB_ADDR, code, "rgb")
a_swizzle_sel, a_sels = disassemble_a_swizzle_sel(code)
rgb_swizzle_sel, rgb_sels = disassemble_rgb_swizzle_sel(code)
#print(", ".join([*rgb_swizzle_sel, *a_swizzle_sel]))
tex_sem_wait = US_CMN_INST.TEX_SEM_WAIT(code)
_, a_op, _ = US_ALU_ALPHA_INST._ALPHA_OP(code)
_, rgb_op, _ = US_ALU_RGBA_INST._RGB_OP(code)
a_op_operands = _a_op_operands[a_op]
rgb_op_operands = _rgb_op_operands[rgb_op]
(a_out_str, a_temp_str), (rgb_out_str, rgb_temp_str) = disassemble_alu_dest(code)
if tex_sem_wait:
print("TEX_SEM_WAIT")
if not VERBOSE:
a_swizzle_sel = a_swizzle_sel[:a_op_operands]
rgb_swizzle_sel = rgb_swizzle_sel[:rgb_op_operands]
a_sources = set(a_sels)
rgb_sources = set(rgb_sels)
a_addr_strs = [s for i, s in enumerate(a_addr_strs) if i in a_sources]
rgb_addr_strs = [s for i, s in enumerate(rgb_addr_strs) if i in rgb_sources]
print(", ".join([*a_addr_strs, *rgb_addr_strs]), ":")
#print(", ".join(a_addr_strs), ":")
print(f" {a_out_str} = {a_temp_str} = {a_op.ljust(6)} {' '.join(a_swizzle_sel)}", ",")
#print(", ".join(rgb_addr_strs), ":")
print(f" {rgb_out_str} = {rgb_temp_str} = {rgb_op.ljust(6)} {' '.join(rgb_swizzle_sel)}", ";")
def disassemble(code):
assert len(code) == 6, len(code)
type = US_CMN_INST.TYPE(code)
if type == US_CMN_INST.TYPE.US_INST_TYPE_OUT:
disassemble_alu(code, is_output=True)
elif type == US_CMN_INST.TYPE.US_INST_TYPE_ALU:
disassemble_alu(code, is_output=False)
else:
assert False, US_CMN_INST._TYPE(code[ix + 0])
def parse_hex(s):
assert s.startswith('0x')
return int(s.removeprefix('0x'), 16)
if __name__ == "__main__":
filename = sys.argv[1]
with open(filename) as f:
buf = f.read()
code = [parse_hex(c.strip()) for c in buf.split(',') if c.strip()]
for i in range(len(code) // 6):
start = (i + 0) * 6
end = (i + 1) * 6
disassemble(code[start:end])
print()