#include #include "holly/background.hpp" #include "holly/core.hpp" #include "holly/core_bits.hpp" #include "holly/holly.hpp" #include "holly/isp_tsp.hpp" #include "holly/region_array.hpp" #include "holly/ta_bits.hpp" #include "holly/ta_fifo_polygon_converter.hpp" #include "holly/ta_global_parameter.hpp" #include "holly/ta_parameter.hpp" #include "holly/ta_vertex_parameter.hpp" #include "holly/texture_memory_alloc5.hpp" #include "holly/video_output.hpp" #include "systembus.hpp" #include "systembus_bits.hpp" #include "maple/maple.hpp" #include "maple/maple_host_command_writer.hpp" #include "maple/maple_bus_bits.hpp" #include "maple/maple_bus_commands.hpp" #include "maple/maple_bus_ft0.hpp" #include "memorymap.hpp" #include "sh7091/sh7091.hpp" #include "sh7091/sh7091_bits.hpp" #include "sh7091/serial.hpp" #include "printf/printf.h" #include "interrupt.hpp" #include "assert.h" #include "math/vec2.hpp" #include "math/vec3.hpp" #include "math/vec4.hpp" #include "math/mat2x2.hpp" #include "math/mat3x3.hpp" #include "math/mat4x4.hpp" #include "math/geometry.hpp" #include "math/transform.hpp" using vec2 = vec<2, float>; using vec3 = vec<3, float>; using vec4 = vec<4, float>; using mat4x4 = mat<4, 4, float>; #include "md5/md5mesh.h" #include "md5/md5anim.h" #include "model/boblamp/boblamp_mesh.h" #include "model/boblamp/boblamp_anim.h" static int joint_ix_sel = 0; static int animation_tick = 0; static int animation_frames = 0; constexpr int ticks_per_animation_frame = 3; constexpr float tick_div = 1.0f / (float)ticks_per_animation_frame; static ft0::data_transfer::data_format data[4]; uint8_t send_buf[1024] __attribute__((aligned(32))); uint8_t recv_buf[1024] __attribute__((aligned(32))); void do_get_condition() { auto writer = maple::host_command_writer(send_buf, recv_buf); using command_type = maple::get_condition; using response_type = maple::data_transfer; auto [host_command, host_response] = writer.append_command_all_ports(); for (int port = 0; port < 4; port++) { auto& data_fields = host_command[port].bus_data.data_fields; data_fields.function_type = std::byteswap(function_type::controller); } maple::dma_start(send_buf, writer.send_offset, recv_buf, writer.recv_offset); for (uint8_t port = 0; port < 4; port++) { auto& bus_data = host_response[port].bus_data; if (bus_data.command_code != response_type::command_code) { return; } auto& data_fields = bus_data.data_fields; if ((std::byteswap(data_fields.function_type) & function_type::controller) == 0) { return; } data[port].digital_button = data_fields.data.digital_button; for (int i = 0; i < 6; i++) { data[port].analog_coordinate_axis[i] = data_fields.data.analog_coordinate_axis[i]; } } } void vbr100() { serial::string("vbr100\n"); interrupt_exception(); } void vbr400() { serial::string("vbr400\n"); interrupt_exception(); } const int framebuffer_width = 640; const int framebuffer_height = 480; const int tile_width = framebuffer_width / 32; const int tile_height = framebuffer_height / 32; constexpr uint32_t ta_alloc = 0 | ta_alloc_ctrl::pt_opb::no_list | ta_alloc_ctrl::tm_opb::no_list | ta_alloc_ctrl::t_opb::no_list | ta_alloc_ctrl::om_opb::no_list | ta_alloc_ctrl::o_opb::_32x4byte; constexpr int ta_cont_count = 1; constexpr struct opb_size opb_size[ta_cont_count] = { { .opaque = 32 * 4, .opaque_modifier = 0, .translucent = 0, .translucent_modifier = 0, .punch_through = 0 } }; static volatile int ta_in_use = 0; static volatile int core_in_use = 0; static volatile int next_frame = 0; static volatile int framebuffer_ix = 0; static volatile int next_frame_ix = 0; static inline void pump_events(uint32_t istnrm) { if (istnrm & istnrm::v_blank_in) { system.ISTNRM = istnrm::v_blank_in; next_frame = 1; holly.FB_R_SOF1 = texture_memory_alloc.framebuffer[next_frame_ix].start; } if (istnrm & istnrm::end_of_render_tsp) { system.ISTNRM = istnrm::end_of_render_tsp | istnrm::end_of_render_isp | istnrm::end_of_render_video; next_frame_ix = framebuffer_ix; framebuffer_ix += 1; if (framebuffer_ix >= 3) framebuffer_ix = 0; core_in_use = 0; } if (istnrm & istnrm::end_of_transferring_opaque_list) { system.ISTNRM = istnrm::end_of_transferring_opaque_list; core_in_use = 1; core_start_render2(texture_memory_alloc.region_array.start, texture_memory_alloc.isp_tsp_parameters.start, texture_memory_alloc.background[0].start, texture_memory_alloc.framebuffer[framebuffer_ix].start, framebuffer_width); assert(ta_in_use); ta_in_use = 0; } } void vbr600() { uint32_t sr; asm volatile ("stc sr,%0" : "=r" (sr)); sr |= sh::sr::imask(15); asm volatile ("ldc %0,sr" : : "r" (sr)); //serial::string("imask\n"); //check_pipeline(); if (sh7091.CCN.EXPEVT == 0 && sh7091.CCN.INTEVT == 0x320) { uint32_t istnrm = system.ISTNRM; uint32_t isterr = system.ISTERR; if (isterr) { serial::string("isterr: "); serial::integer(system.ISTERR); } pump_events(istnrm); sr &= ~sh::sr::imask(15); asm volatile ("ldc %0,sr" : : "r" (sr)); return; } serial::string("vbr600\n"); interrupt_exception(); } void global_polygon_type_0(ta_parameter_writer& writer, uint32_t para_control_obj_control, uint32_t tsp_instruction_word, uint32_t texture_control_word, const float a = 1.0f, const float r = 1.0f, const float g = 1.0f, const float b = 1.0f ) { const uint32_t parameter_control_word = para_control::para_type::polygon_or_modifier_volume | obj_control::col_type::floating_color | obj_control::gouraud | para_control_obj_control ; const uint32_t isp_tsp_instruction_word = isp_tsp_instruction_word::depth_compare_mode::greater | isp_tsp_instruction_word::culling_mode::no_culling ; writer.append() = ta_global_parameter::polygon_type_0(parameter_control_word, isp_tsp_instruction_word, tsp_instruction_word, texture_control_word, 0, 0 ); } void transfer_triangle(ta_parameter_writer& writer, vec3 ap, vec3 bp, vec3 cp, vec3 ac, vec3 bc, vec3 cc ) { if (ap.z < 0 || bp.z < 0 || cp.z < 0) return; writer.append() = ta_vertex_parameter::polygon_type_1(polygon_vertex_parameter_control_word(false), ap.x, ap.y, ap.z, 1.0, ac.x, ac.y, ac.z); writer.append() = ta_vertex_parameter::polygon_type_1(polygon_vertex_parameter_control_word(false), bp.x, bp.y, bp.z, 1.0, bc.x, bc.y, bc.z); writer.append() = ta_vertex_parameter::polygon_type_1(polygon_vertex_parameter_control_word(true), cp.x, cp.y, cp.z, 1.0, cc.x, cc.y, cc.z); } vec4 quaternion_normalize(vec4 q) { float mag = magnitude(q); if (mag > 0.0f) { return q * (1.0f / mag); } else { return q; } } vec4 quaternion_mul_quaternion(vec4 a, vec4 b) { return (vec4){ (a.x * b.w) + (a.w * b.x) + (a.y * b.z) - (a.z * b.y), (a.y * b.w) + (a.w * b.y) + (a.z * b.x) - (a.x * b.z), (a.z * b.w) + (a.w * b.z) + (a.x * b.y) - (a.y * b.x), (a.w * b.w) - (a.x * b.x) - (a.y * b.y) - (a.z * b.z), }; } vec4 quaternion_mul_vec4(vec4 q, vec3 v) { return (vec4){ (q.w * v.x) + (q.y * v.z) - (q.z * v.y), (q.w * v.y) + (q.z * v.x) - (q.x * v.z), (q.w * v.z) + (q.x * v.y) - (q.y * v.x), - (q.x * v.x) - (q.y * v.y) - (q.z * v.z), }; } vec3 quaternion_rotate_point(vec4 q, vec3 v) { vec4 neg = { -q.x, -q.y, -q.z, q.w, }; vec4 qv = quaternion_mul_quaternion(quaternion_mul_vec4(q, v), quaternion_normalize(neg)); return (vec3){qv.x, qv.y, qv.z}; } static inline float quaternion_unit_w(vec4 q) { float t = 1.0 - (q.x * q.x) - (q.y * q.y) - (q.z * q.z); if (t < 0.0) return 0.0; else return -sqrt(t); } struct pos_orient { vec3 pos; vec4 orient; }; pos_orient skeleton0[64]; pos_orient skeleton1[64]; void build_skeleton(const md5_anim * anim, int frame_ix, pos_orient * skeleton) { for (int i = 0; i < anim->num_joints; i++) { md5_anim_base_frame * base_frame = &anim->base_frame[i]; vec3 pos = base_frame->pos; vec4 orient = base_frame->orient; float * frame = anim->frame[frame_ix]; md5_anim_hierarchy * hierarchy = &anim->hierarchy[i]; assert(hierarchy->flags == 0b111111); pos.x = frame[hierarchy->start_index + 0]; pos.y = frame[hierarchy->start_index + 1]; pos.z = frame[hierarchy->start_index + 2]; orient.x = frame[hierarchy->start_index + 3]; orient.y = frame[hierarchy->start_index + 4]; orient.z = frame[hierarchy->start_index + 5]; orient.w = quaternion_unit_w(orient); if (hierarchy->parent_index >= 0) { pos_orient * parent = &skeleton[hierarchy->parent_index]; vec3 rpos = quaternion_rotate_point(parent->orient, pos); pos = rpos + parent->pos; orient = quaternion_mul_quaternion(parent->orient, orient); orient = quaternion_normalize(orient); } skeleton[i].pos = pos; skeleton[i].orient = orient; } } void interpolate_skeleton(int length, pos_orient * a, pos_orient * b, float lerp) { for (int i = 0; i < length; i++) { a[i].pos = a[i].pos + (b[i].pos - a[i].pos) * lerp; a[i].orient = a[i].orient + (b[i].orient - a[i].orient) * lerp; } } vec3 vertex_weights(const md5_mesh_joint * joints, const md5_mesh_mesh * mesh, const md5_mesh_vert * v) { const md5_mesh_weight * weights = &mesh->weights[v->weight_index]; vec3 sum = {0, 0, 0}; for (int i = 0; i < v->weight_elem; i++) { const md5_mesh_weight * weight = &weights[i]; //const md5_mesh_joint * joint = &joints[weight->joint_index]; pos_orient * joint = &skeleton0[weight->joint_index]; vec3 rv = quaternion_rotate_point(joint->orient, weight->pos); sum += (joint->pos + rv) * weight->weight_value; } return sum; } vec3 vertex_weight_color(const md5_mesh_joint * joints, const md5_mesh_mesh * mesh, const md5_mesh_vert * v) { const md5_mesh_weight * weights = &mesh->weights[v->weight_index]; for (int i = 0; i < v->weight_elem; i++) { const md5_mesh_weight * weight = &weights[i]; if (weight->joint_index == joint_ix_sel) { return {weight->weight_value, 1.0f - weight->weight_value, 0.0}; } } return {0.0, 0.0, 1.0}; } static inline vec3 screen_transform(vec3 v) { float x2 = 640 / 2.0; float y2 = 480 / 2.0; float iz = 1.0f / v.z; return { v.x * iz * y2 + x2, v.y * iz * y2 + y2, iz, }; } float light_intensity(vec3 l1, vec3 n) { float intensity = 0.2f; { float n_dot_l = dot(n, l1); if (n_dot_l > 0) intensity += 0.9f * n_dot_l * (inverse_length(n) * inverse_length(l1)); } if (intensity > 1.0f) intensity = 1.0f; return intensity; } void transfer_mesh(ta_parameter_writer& writer, const mat4x4& screen_trans, const md5_mesh_joint * joints, const md5_mesh_mesh * mesh) { const vec3 light_pos = {1.2f, 1.0f, -2.0f}; for (int i = 0; i < mesh->num_tris; i++) { const md5_mesh_tri * tri = &mesh->tris[i]; const md5_mesh_vert * av = &mesh->verts[tri->vert_index.a]; const md5_mesh_vert * bv = &mesh->verts[tri->vert_index.b]; const md5_mesh_vert * cv = &mesh->verts[tri->vert_index.c]; vec3 ap = screen_trans * vertex_weights(joints, mesh, av); vec3 bp = screen_trans * vertex_weights(joints, mesh, bv); vec3 cp = screen_trans * vertex_weights(joints, mesh, cv); vec3 n = -normalize(cross(bp - ap, cp - ap)); vec3 a_light_dir = normalize(light_pos - ap); vec3 b_light_dir = normalize(light_pos - bp); vec3 c_light_dir = normalize(light_pos - cp); float a_diffuse = max(dot(n, a_light_dir), 0.0f); float b_diffuse = max(dot(n, b_light_dir), 0.0f); float c_diffuse = max(dot(n, c_light_dir), 0.0f); vec3 ac = vertex_weight_color(joints, mesh, av); vec3 bc = vertex_weight_color(joints, mesh, bv); vec3 cc = vertex_weight_color(joints, mesh, cv); transfer_triangle(writer, screen_transform(ap), screen_transform(bp), screen_transform(cp), ac * a_diffuse, bc * b_diffuse, cc * c_diffuse ); } } void transfer_scene(ta_parameter_writer& writer, const mat4x4& screen_trans) { uint32_t control = para_control::list_type::opaque; uint32_t tsp_instruction_word = tsp_instruction_word::src_alpha_instr::one | tsp_instruction_word::dst_alpha_instr::zero | tsp_instruction_word::fog_control::no_fog | tsp_instruction_word::texture_shading_instruction::decal; uint32_t texture_control_word = 0; global_polygon_type_0(writer, control, tsp_instruction_word, texture_control_word); int frame_ix0 = animation_tick / ticks_per_animation_frame; int frame_ix1 = frame_ix0 + 1; if (frame_ix1 >= animation_frames) frame_ix1 = 0; md5_anim * anim = &boblamp_anim; build_skeleton(anim, frame_ix0, skeleton0); build_skeleton(anim, frame_ix1, skeleton1); float lerp = (float)(animation_tick - (frame_ix0 * ticks_per_animation_frame)) * tick_div; interpolate_skeleton(anim->num_joints, skeleton0, skeleton1, lerp); for (int i = 0; i < boblamp_mesh.num_meshes; i++) { transfer_mesh(writer, screen_trans, boblamp_mesh.joints, &boblamp_mesh.meshes[i]); } writer.append() = ta_global_parameter::end_of_list(para_control::para_type::end_of_list); } void update_maple(struct md5_mesh * m, struct md5_anim * a) { int ra = ft0::data_transfer::digital_button::ra(data[0].digital_button) == 0; int la = ft0::data_transfer::digital_button::la(data[0].digital_button) == 0; int ua = ft0::data_transfer::digital_button::ua(data[0].digital_button) == 0; int da = ft0::data_transfer::digital_button::da(data[0].digital_button) == 0; static int last_ra = 0; static int last_la = 0; static int last_ua = 0; static int last_da = 0; if (ra && last_ra == 0) { joint_ix_sel += 1; printf("joint_ix_sel: %d\n", joint_ix_sel); if (joint_ix_sel >= m->num_joints) joint_ix_sel = 0; } if (la && last_la == 0) { joint_ix_sel -= 1; printf("joint_ix_sel: %d\n", joint_ix_sel); if (joint_ix_sel < 0) joint_ix_sel = m->num_joints - 1; } /* if (ua && last_ua == 0) { frame_ix_sel += 1; printf("frame_ix_sel: %d\n", frame_ix_sel); if (frame_ix_sel >= a->num_frames) frame_ix_sel = 0; } if (da && last_da == 0) { frame_ix_sel -= 1; printf("frame_ix_sel: %d\n", frame_ix_sel); if (frame_ix_sel < 0) frame_ix_sel = a->num_frames - 1; } */ last_ra = ra; last_la = la; last_ua = ua; last_da = da; } uint8_t __attribute__((aligned(32))) ta_parameter_buf[1024 * 1024]; int main() { sh7091.TMU.TSTR = 0; // stop all timers sh7091.TMU.TOCR = tmu::tocr::tcoe::tclk_is_external_clock_or_input_capture; sh7091.TMU.TCR0 = tmu::tcr0::tpsc::p_phi_256; // 256 / 50MHz = 5.12 μs ; underflows in ~1 hour sh7091.TMU.TCOR0 = 0xffff'ffff; sh7091.TMU.TCNT0 = 0xffff'ffff; sh7091.TMU.TSTR = tmu::tstr::str0::counter_start; serial::init(0); interrupt_init(); holly.SOFTRESET = softreset::pipeline_soft_reset | softreset::ta_soft_reset; holly.SOFTRESET = 0; core_init(); holly.FPU_SHAD_SCALE = fpu_shad_scale::simple_shadow_enable::parameter_selection_volume_mode; system.IML6NRM = istnrm::end_of_render_tsp | istnrm::v_blank_in | istnrm::end_of_transferring_opaque_list; region_array_multipass(tile_width, tile_height, opb_size, ta_cont_count, texture_memory_alloc.region_array.start, texture_memory_alloc.object_list.start); background_parameter2(texture_memory_alloc.background[0].start, 0xff202040); ta_parameter_writer writer = ta_parameter_writer(ta_parameter_buf, (sizeof (ta_parameter_buf))); video_output::set_mode_vga(); mat4x4 screen_trans = { 1, 0, 0, 0, 0, 0, -1, 0, 0, 1, 0, 40, 0, 0, 0, 1, }; screen_trans = translate((vec3){0, 30, 0}) * screen_trans; animation_tick = 0; animation_frames = boblamp_anim.num_frames; do_get_condition(); while (1) { maple::dma_wait_complete(); do_get_condition(); update_maple(&boblamp_mesh, &boblamp_anim); //screen_trans = screen_trans * rotate_z(0.01f); writer.offset = 0; transfer_scene(writer, screen_trans); while (ta_in_use); while (core_in_use); ta_in_use = 1; ta_polygon_converter_init2(texture_memory_alloc.isp_tsp_parameters.start, texture_memory_alloc.isp_tsp_parameters.end, texture_memory_alloc.object_list.start, texture_memory_alloc.object_list.end, opb_size[0].total(), ta_alloc, tile_width, tile_height); ta_polygon_converter_writeback(writer.buf, writer.offset); ta_polygon_converter_transfer(writer.buf, writer.offset); while (next_frame == 0); next_frame = 0; // increment tick animation_tick += 1; if (animation_tick >= animation_frames * ticks_per_animation_frame) animation_tick = 0; } }