The previous texture_memory_alloc.hpp was written based on an incorrect understanding of the "32-bit" and "64-bit" texture memory address mapping. The primary motivation is to rearrange the texture memory address map so that "textures" (64-bit access) do not overlap with 32-bit accesses, such as REGION_BASE or PARAM_BASE.
400 lines
12 KiB
C++
400 lines
12 KiB
C++
#include <cstdint>
|
|
|
|
#include "align.hpp"
|
|
#include "holly/video_output.hpp"
|
|
|
|
#include "holly/holly.hpp"
|
|
#include "holly/core.hpp"
|
|
#include "holly/core_bits.hpp"
|
|
#include "holly/ta_fifo_polygon_converter.hpp"
|
|
#include "holly/ta_parameter.hpp"
|
|
#include "holly/ta_global_parameter.hpp"
|
|
#include "holly/ta_vertex_parameter.hpp"
|
|
#include "holly/isp_tsp.hpp"
|
|
#include "holly/ta_bits.hpp"
|
|
#include "holly/region_array.hpp"
|
|
#include "holly/background.hpp"
|
|
#include "holly/texture_memory_alloc.hpp"
|
|
#include "memorymap.hpp"
|
|
#include "sh7091/sh7091.hpp"
|
|
#include "sh7091/sh7091_bits.hpp"
|
|
#include "sh7091/serial.hpp"
|
|
#include "palette.hpp"
|
|
|
|
#include "geometry/suzanne.hpp"
|
|
#include "geometry/circle.hpp"
|
|
#include "math/vec4.hpp"
|
|
|
|
#include "font/font_bitmap.hpp"
|
|
#include "verite_8x16.hpp"
|
|
#include "string.hpp"
|
|
|
|
constexpr float half_degree = 0.01745329f / 2;
|
|
|
|
#define MODEL suzanne
|
|
|
|
vec3 rotate(const vec3& vertex,
|
|
const float theta)
|
|
{
|
|
float x = vertex.x;
|
|
float y = vertex.y;
|
|
float z = vertex.z;
|
|
float t;
|
|
|
|
t = y * cos(theta) - z * sin(theta);
|
|
z = y * sin(theta) + z * cos(theta);
|
|
y = t;
|
|
|
|
float theta2 = 3.14 * sin(theta / 2);
|
|
|
|
t = x * cos(theta2) - z * sin(theta2);
|
|
z = x * sin(theta2) + z * cos(theta2);
|
|
x = t;
|
|
|
|
return vec3(x, y, z);
|
|
}
|
|
|
|
void transform(ta_parameter_writer& parameter,
|
|
const uint32_t face_ix,
|
|
const float theta,
|
|
const vec3 lights[3])
|
|
{
|
|
const uint32_t parameter_control_word = para_control::para_type::polygon_or_modifier_volume
|
|
| para_control::list_type::opaque
|
|
| obj_control::col_type::floating_color
|
|
| obj_control::gouraud;
|
|
|
|
const uint32_t isp_tsp_instruction_word = isp_tsp_instruction_word::depth_compare_mode::greater
|
|
| isp_tsp_instruction_word::culling_mode::cull_if_positive;
|
|
|
|
const uint32_t tsp_instruction_word = tsp_instruction_word::src_alpha_instr::one
|
|
| tsp_instruction_word::dst_alpha_instr::zero
|
|
| tsp_instruction_word::fog_control::no_fog;
|
|
|
|
parameter.append<ta_global_parameter::polygon_type_0>() =
|
|
ta_global_parameter::polygon_type_0(parameter_control_word,
|
|
isp_tsp_instruction_word,
|
|
tsp_instruction_word,
|
|
0, // texture_control_word
|
|
0, // data_size_for_sort_dma
|
|
0 // next_address_for_sort_dma
|
|
);
|
|
auto& face = MODEL::faces[face_ix];
|
|
|
|
constexpr uint32_t strip_length = 3;
|
|
for (uint32_t i = 0; i < strip_length; i++) {
|
|
// world transform
|
|
uint32_t vertex_ix = face[i].vertex;
|
|
auto& vertex = MODEL::vertices[vertex_ix];
|
|
auto point = rotate(vertex, theta);
|
|
|
|
// lighting transform
|
|
uint32_t normal_ix = face[i].normal;
|
|
auto& normal = MODEL::normals[normal_ix];
|
|
auto n = rotate(normal, theta);
|
|
|
|
vec4 color = {0.2, 0.2, 0.2, 1.0};
|
|
|
|
// intensity calculation
|
|
{
|
|
auto l = lights[0] - point;
|
|
auto n_dot_l = dot(n, l);
|
|
if (n_dot_l > 0) {
|
|
color.x += 0.6 * n_dot_l / (length(n) * length(l));
|
|
}
|
|
}
|
|
|
|
{
|
|
auto l = lights[1] - point;
|
|
auto n_dot_l = dot(n, l);
|
|
if (n_dot_l > 0) {
|
|
color.y += 0.6 * n_dot_l / (length(n) * length(l));
|
|
}
|
|
}
|
|
|
|
{
|
|
auto l = lights[2] - point;
|
|
auto n_dot_l = dot(n, l);
|
|
if (n_dot_l > 0) {
|
|
color.z += 0.6 * n_dot_l / (length(n) * length(l));
|
|
}
|
|
}
|
|
|
|
float x = point.x;
|
|
float y = point.y;
|
|
float z = point.z;
|
|
|
|
x *= 10;
|
|
y *= 10;
|
|
z *= 10;
|
|
|
|
// camera transform
|
|
z += 20;
|
|
|
|
// perspective
|
|
x = x / z;
|
|
y = y / z;
|
|
|
|
// screen space transform
|
|
x *= 240.f;
|
|
y *= 240.f;
|
|
x += 320.f;
|
|
y += 240.f;
|
|
z = 1 / z;
|
|
|
|
bool end_of_strip = i == strip_length - 1;
|
|
parameter.append<ta_vertex_parameter::polygon_type_1>() =
|
|
ta_vertex_parameter::polygon_type_1(polygon_vertex_parameter_control_word(end_of_strip),
|
|
x, y, z,
|
|
color.w, // alpha
|
|
color.x, // r
|
|
color.y, // g
|
|
color.z // b
|
|
);
|
|
}
|
|
}
|
|
|
|
void transform2(ta_parameter_writer& parameter,
|
|
const vec3& pos,
|
|
const vec4& color)
|
|
{
|
|
const uint32_t parameter_control_word = para_control::para_type::polygon_or_modifier_volume
|
|
| para_control::list_type::opaque
|
|
| obj_control::col_type::floating_color
|
|
| obj_control::gouraud;
|
|
|
|
const uint32_t isp_tsp_instruction_word = isp_tsp_instruction_word::depth_compare_mode::greater
|
|
| isp_tsp_instruction_word::culling_mode::no_culling;
|
|
|
|
const uint32_t tsp_instruction_word = tsp_instruction_word::src_alpha_instr::one
|
|
| tsp_instruction_word::dst_alpha_instr::zero
|
|
| tsp_instruction_word::fog_control::no_fog;
|
|
|
|
parameter.append<ta_global_parameter::polygon_type_0>() =
|
|
ta_global_parameter::polygon_type_0(parameter_control_word,
|
|
isp_tsp_instruction_word,
|
|
tsp_instruction_word,
|
|
0, // texture_control_word
|
|
0, // data_size_for_sort_dma
|
|
0 // next_address_for_sort_dma
|
|
);
|
|
|
|
constexpr vec3 triangle[] = {
|
|
{ 0.f, -1.f, 0.f},
|
|
{-1.f, 1.f, 0.f},
|
|
{ 1.f, 1.f, 0.f},
|
|
};
|
|
|
|
constexpr uint32_t strip_length = 3;
|
|
for (uint32_t i = 0; i < strip_length; i++) {
|
|
float x = triangle[i].x;
|
|
float y = triangle[i].y;
|
|
float z = triangle[i].z;
|
|
|
|
x *= 0.2;
|
|
y *= 0.2;
|
|
z *= 0.2;
|
|
|
|
x += pos.x;
|
|
y += pos.y;
|
|
z += pos.z;
|
|
|
|
// camera transform
|
|
z += 20;
|
|
|
|
// perspective
|
|
x = x / z;
|
|
y = y / z;
|
|
|
|
// screen space transform
|
|
x *= 240.f;
|
|
y *= 240.f;
|
|
x += 320.f;
|
|
y += 240.f;
|
|
z = 1 / z;
|
|
|
|
bool end_of_strip = i == strip_length - 1;
|
|
parameter.append<ta_vertex_parameter::polygon_type_1>() =
|
|
ta_vertex_parameter::polygon_type_1(polygon_vertex_parameter_control_word(end_of_strip),
|
|
x, y, z,
|
|
color.w, // alpha
|
|
color.x, // r
|
|
color.y, // g
|
|
color.z // b
|
|
);
|
|
}
|
|
}
|
|
|
|
void init_texture_memory(const struct opb_size& opb_size)
|
|
{
|
|
region_array2(640 / 32, // width
|
|
480 / 32, // height
|
|
opb_size
|
|
);
|
|
|
|
background_parameter(0xff220000);
|
|
}
|
|
|
|
uint32_t _ta_parameter_buf[((32 * 8192) + 32) / 4];
|
|
|
|
static inline void label_number(ta_parameter_writer& parameter,
|
|
const char * label,
|
|
const uint32_t len,
|
|
const uint32_t number,
|
|
const uint32_t row)
|
|
{
|
|
constexpr uint32_t max_label_len = 10;
|
|
char buf[8];
|
|
|
|
string::hex(buf, 8, number);
|
|
font_bitmap::transform_string(parameter,
|
|
8, 16, // texture
|
|
8, 16, // glyph
|
|
16 + (8 * (max_label_len - len)), // position x
|
|
16 * row, // position y
|
|
label, len,
|
|
para_control::list_type::opaque);
|
|
font_bitmap::transform_string(parameter,
|
|
8, 16, // texture
|
|
8, 16, // glyph
|
|
16 + (8 * (max_label_len + 1)), // position x
|
|
16 * row, // position y
|
|
buf, 8,
|
|
para_control::list_type::opaque);
|
|
}
|
|
|
|
void main()
|
|
{
|
|
sh7091.TMU.TSTR = 0; // stop all timers
|
|
sh7091.TMU.TOCR = tmu::tocr::tcoe::tclk_is_external_clock_or_input_capture;
|
|
sh7091.TMU.TCR0 = tmu::tcr0::tpsc::p_phi_256; // 256 / 50MHz = 5.12 μs ; underflows in ~1 hour
|
|
sh7091.TMU.TCOR0 = 0xffff'ffff;
|
|
sh7091.TMU.TCNT0 = 0xffff'ffff;
|
|
sh7091.TMU.TSTR = tmu::tstr::str0::counter_start;
|
|
|
|
video_output::set_mode_vga();
|
|
|
|
auto src = reinterpret_cast<const uint8_t *>(&_binary_verite_8x16_data_start);
|
|
font_bitmap::inflate(1, // pitch
|
|
8, // width
|
|
16, // height
|
|
8, // texture_width
|
|
16, // texture_height
|
|
src);
|
|
palette_data<3>();
|
|
|
|
// The address of `ta_parameter_buf` must be a multiple of 32 bytes.
|
|
// This is mandatory for ch2-dma to the ta fifo polygon converter.
|
|
uint32_t * ta_parameter_buf = align_32byte(_ta_parameter_buf);
|
|
|
|
constexpr uint32_t ta_alloc = ta_alloc_ctrl::pt_opb::no_list
|
|
| ta_alloc_ctrl::tm_opb::no_list
|
|
| ta_alloc_ctrl::t_opb::no_list
|
|
| ta_alloc_ctrl::om_opb::no_list
|
|
| ta_alloc_ctrl::o_opb::_16x4byte;
|
|
|
|
constexpr struct opb_size opb_size = { .opaque = 16 * 4
|
|
, .opaque_modifier = 0
|
|
, .translucent = 0
|
|
, .translucent_modifier = 0
|
|
, .punch_through = 0
|
|
};
|
|
|
|
holly.SOFTRESET = softreset::pipeline_soft_reset
|
|
| softreset::ta_soft_reset;
|
|
holly.SOFTRESET = 0;
|
|
|
|
core_init();
|
|
init_texture_memory(opb_size);
|
|
|
|
uint32_t frame_ix = 0;
|
|
|
|
float theta = 0;
|
|
vec3 lights[3] = {
|
|
{0.f, 0.f, 0.f},
|
|
{0.f, 0.f, 0.f},
|
|
{0.f, 0.f, 0.f},
|
|
};
|
|
|
|
uint32_t t_transform_start = 0;
|
|
uint32_t t_transform_end = 0;
|
|
uint32_t t_text_start = 0;
|
|
uint32_t t_text_end = 0;
|
|
uint32_t t_transfer_start = 0;
|
|
uint32_t t_transfer_end = 0;
|
|
uint32_t t_render_start = 0;
|
|
uint32_t t_render_end = 0;
|
|
|
|
while (1) {
|
|
ta_polygon_converter_init(opb_size.total(),
|
|
ta_alloc,
|
|
640 / 32,
|
|
480 / 32);
|
|
auto parameter = ta_parameter_writer(ta_parameter_buf);
|
|
|
|
// transform start
|
|
t_transform_start = sh7091.TMU.TCNT0;
|
|
{
|
|
const float theta2 = 3.14 * 2 * sin(theta / 7);
|
|
|
|
lights[0].x = cos(theta) * 15;
|
|
lights[0].z = sin(theta) * 15;
|
|
|
|
lights[1].x = cos(theta2 + half_degree * 180.f) * 15;
|
|
lights[1].z = sin(theta2 + half_degree * 180.f) * 15;
|
|
|
|
lights[2].x = cos(theta + half_degree * 360.f) * 15;
|
|
lights[2].z = sin(theta + half_degree * 360.f) * 15;
|
|
|
|
for (uint32_t i = 0; i < MODEL::num_faces; i++) {
|
|
transform(parameter, i, theta, lights);
|
|
}
|
|
transform2(parameter, lights[0], {1.f, 0.f, 0.f, 1.f});
|
|
transform2(parameter, lights[1], {0.f, 1.f, 0.f, 1.f});
|
|
transform2(parameter, lights[2], {0.f, 0.f, 1.f, 1.f});
|
|
}
|
|
t_transform_end = sh7091.TMU.TCNT0;
|
|
// transform end
|
|
|
|
uint32_t _t_text_start = sh7091.TMU.TCNT0;
|
|
{
|
|
|
|
const uint32_t transform = t_transform_start - t_transform_end;
|
|
label_number(parameter, "transform:", 10, transform, 1);
|
|
|
|
const uint32_t text = t_text_start - t_text_end;
|
|
label_number(parameter, "text:", 5, text, 2);
|
|
|
|
const uint32_t transfer = t_transfer_start - t_transfer_end;
|
|
label_number(parameter, "transfer:", 9, transfer, 3);
|
|
|
|
const uint32_t render = t_render_start - t_render_end;
|
|
label_number(parameter, "render:", 7, render, 4);
|
|
}
|
|
t_text_start = _t_text_start;
|
|
t_text_end = sh7091.TMU.TCNT0;
|
|
|
|
parameter.append<ta_global_parameter::end_of_list>() = ta_global_parameter::end_of_list(para_control::para_type::end_of_list);
|
|
|
|
// transfer start
|
|
t_transfer_start = sh7091.TMU.TCNT0;
|
|
{
|
|
ta_polygon_converter_transfer(ta_parameter_buf, parameter.offset);
|
|
ta_wait_opaque_list();
|
|
}
|
|
t_transfer_end = sh7091.TMU.TCNT0;
|
|
|
|
t_render_start = sh7091.TMU.TCNT0;
|
|
core_start_render(frame_ix);
|
|
core_wait_end_of_render_video();
|
|
t_render_end = sh7091.TMU.TCNT0;
|
|
|
|
while (!spg_status::vsync(holly.SPG_STATUS));
|
|
core_flip(frame_ix);
|
|
while (spg_status::vsync(holly.SPG_STATUS));
|
|
|
|
theta += half_degree * 0.5;
|
|
frame_ix = (frame_ix + 1) & 1;
|
|
}
|
|
}
|