blob: 931b5cd81daf241f09e93ea7199a3a556b453520 [file] [log] [blame]
/* -*- mesa-c++ -*-
*
* Copyright (c) 2018 Collabora LTD
*
* Author: Gert Wollny <gert.wollny@collabora.com>
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* on the rights to use, copy, modify, merge, publish, distribute, sub
* license, and/or sell copies of the Software, and to permit persons to whom
* the Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
* THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
* DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
* OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
* USE OR OTHER DEALINGS IN THE SOFTWARE.
*/
#include "tgsi/tgsi_from_mesa.h"
#include "sfn_shader_geometry.h"
#include "sfn_instruction_misc.h"
#include "sfn_instruction_fetch.h"
namespace r600 {
GeometryShaderFromNir::GeometryShaderFromNir(r600_pipe_shader *sh,
r600_pipe_shader_selector &sel,
const r600_shader_key &key):
ShaderFromNirProcessor (PIPE_SHADER_GEOMETRY, sel, sh->shader,
sh->scratch_space_needed),
m_pipe_shader(sh),
m_so_info(&sel.so),
m_first_vertex_emitted(false),
m_offset(0),
m_next_input_ring_offset(0),
m_key(key),
m_num_clip_dist(0),
m_cur_ring_output(0),
m_gs_tri_strip_adj_fix(false)
{
sh_info().atomic_base = key.gs.first_atomic_counter;
}
bool GeometryShaderFromNir::do_emit_load_deref(UNUSED const nir_variable *in_var, UNUSED nir_intrinsic_instr* instr)
{
return false;
}
bool GeometryShaderFromNir::do_emit_store_deref(const nir_variable *out_var, nir_intrinsic_instr* instr)
{
uint32_t write_mask = (1 << instr->num_components) - 1;
GPRVector::Swizzle swz = swizzle_from_mask(instr->num_components);
std::unique_ptr<GPRVector> vec(vec_from_nir_with_fetch_constant(instr->src[1], write_mask, swz));
GPRVector out_value = *vec;
sh_info().output[out_var->data.driver_location].write_mask =
(1 << instr->num_components) - 1;
auto ir = new MemRingOutIntruction(cf_mem_ring, mem_write_ind, out_value,
4 * out_var->data.driver_location,
4, m_export_base);
emit_instruction(ir);
return true;
}
bool GeometryShaderFromNir::scan_sysvalue_access(UNUSED nir_instr *instr)
{
return true;
}
bool GeometryShaderFromNir::do_process_inputs(nir_variable *input)
{
if (input->data.location == VARYING_SLOT_POS ||
input->data.location == VARYING_SLOT_PSIZ ||
input->data.location == VARYING_SLOT_CLIP_DIST0 ||
input->data.location == VARYING_SLOT_CLIP_DIST1 ||
(input->data.location >= VARYING_SLOT_VAR0 &&
input->data.location <= VARYING_SLOT_VAR31) ||
(input->data.location >= VARYING_SLOT_TEX0 &&
input->data.location <= VARYING_SLOT_TEX7)) {
r600_shader_io& io = sh_info().input[input->data.driver_location];
tgsi_get_gl_varying_semantic(static_cast<gl_varying_slot>( input->data.location),
true, &io.name, &io.sid);
io.ring_offset = 16 * input->data.driver_location;
++sh_info().ninput;
m_next_input_ring_offset += 16;
return true;
}
return false;
}
bool GeometryShaderFromNir::do_process_outputs(nir_variable *output)
{
if (output->data.location == VARYING_SLOT_COL0 ||
output->data.location == VARYING_SLOT_COL1 ||
(output->data.location >= VARYING_SLOT_VAR0 &&
output->data.location <= VARYING_SLOT_VAR31) ||
(output->data.location >= VARYING_SLOT_TEX0 &&
output->data.location <= VARYING_SLOT_TEX7) ||
output->data.location == VARYING_SLOT_BFC0 ||
output->data.location == VARYING_SLOT_BFC1 ||
output->data.location == VARYING_SLOT_CLIP_VERTEX ||
output->data.location == VARYING_SLOT_CLIP_DIST0 ||
output->data.location == VARYING_SLOT_CLIP_DIST1 ||
output->data.location == VARYING_SLOT_PRIMITIVE_ID ||
output->data.location == VARYING_SLOT_POS ||
output->data.location == VARYING_SLOT_PSIZ ||
output->data.location == VARYING_SLOT_LAYER ||
output->data.location == VARYING_SLOT_VIEWPORT ||
output->data.location == VARYING_SLOT_FOGC) {
r600_shader_io& io = sh_info().output[output->data.driver_location];
tgsi_get_gl_varying_semantic(static_cast<gl_varying_slot>( output->data.location),
true, &io.name, &io.sid);
evaluate_spi_sid(io);
++sh_info().noutput;
if (output->data.location == VARYING_SLOT_CLIP_DIST0 ||
output->data.location == VARYING_SLOT_CLIP_DIST1) {
m_num_clip_dist += 4;
}
return true;
}
return false;
}
bool GeometryShaderFromNir::allocate_reserved_registers()
{
const int sel[6] = {0, 0 ,0, 1, 1, 1};
const int chan[6] = {0, 1 ,3, 0, 1, 2};
increment_reserved_registers();
increment_reserved_registers();
/* Reserve registers used by the shaders (should check how many
* components are actually used */
for (int i = 0; i < 6; ++i) {
auto reg = new GPRValue(sel[i], chan[i]);
reg->set_as_input();
m_per_vertex_offsets[i].reset(reg);
inject_register(sel[i], chan[i], m_per_vertex_offsets[i], false);
}
auto reg = new GPRValue(0, 2);
reg->set_as_input();
m_primitive_id.reset(reg);
inject_register(0, 2, m_primitive_id, false);
reg = new GPRValue(1, 3);
reg->set_as_input();
m_invocation_id.reset(reg);
inject_register(1, 3, m_invocation_id, false);
m_export_base = get_temp_register();
emit_instruction(new AluInstruction(op1_mov, m_export_base, Value::zero, {alu_write, alu_last_instr}));
sh_info().ring_item_sizes[0] = m_next_input_ring_offset;
if (m_key.gs.tri_strip_adj_fix)
emit_adj_fix();
return true;
}
void GeometryShaderFromNir::emit_adj_fix()
{
PValue adjhelp0(new GPRValue(m_export_base->sel(), 1));
emit_instruction(op2_and_int, adjhelp0, {m_primitive_id, Value::one_i}, {alu_write, alu_last_instr});
int help2 = allocate_temp_register();
int reg_indices[6];
int reg_chanels[6] = {0, 1, 2, 3, 2, 3};
int rotate_indices[6] = {4, 5, 0, 1, 2, 3};
reg_indices[0] = reg_indices[1] = reg_indices[2] = reg_indices[3] = help2;
reg_indices[4] = reg_indices[5] = m_export_base->sel();
std::array<PValue, 6> adjhelp;
AluInstruction *ir = nullptr;
for (int i = 0; i < 6; i++) {
adjhelp[i].reset(new GPRValue(reg_indices[i], reg_chanels[i]));
ir = new AluInstruction(op3_cnde_int, adjhelp[i],
{adjhelp0, m_per_vertex_offsets[i],
m_per_vertex_offsets[rotate_indices[i]]},
{alu_write});
if (i == 3)
ir->set_flag(alu_last_instr);
emit_instruction(ir);
}
ir->set_flag(alu_last_instr);
for (int i = 0; i < 6; i++)
m_per_vertex_offsets[i] = adjhelp[i];
}
bool GeometryShaderFromNir::emit_deref_instruction_override(nir_deref_instr* instr)
{
if (instr->deref_type == nir_deref_type_array) {
auto var = get_deref_location(instr->parent);
ArrayDeref ad = {var, &instr->arr.index};
assert(instr->dest.is_ssa);
m_in_array_deref[instr->dest.ssa.index] = ad;
/* Problem: nir_intrinsice_load_deref tries to lookup the
* variable, and will not find it, need to override that too */
return true;
}
return false;
}
bool GeometryShaderFromNir::emit_intrinsic_instruction_override(nir_intrinsic_instr* instr)
{
switch (instr->intrinsic) {
case nir_intrinsic_load_deref: {
auto& src = instr->src[0];
assert(src.is_ssa);
auto array = m_in_array_deref.find(src.ssa->index);
if (array != m_in_array_deref.end())
return emit_load_from_array(instr, array->second);
} break;
case nir_intrinsic_emit_vertex:
return emit_vertex(instr, false);
case nir_intrinsic_end_primitive:
return emit_vertex(instr, true);
case nir_intrinsic_load_primitive_id:
return load_preloaded_value(instr->dest, 0, m_primitive_id);
case nir_intrinsic_load_invocation_id:
return load_preloaded_value(instr->dest, 0, m_invocation_id);
default:
;
}
return false;
}
bool GeometryShaderFromNir::emit_vertex(nir_intrinsic_instr* instr, bool cut)
{
int stream = nir_intrinsic_stream_id(instr);
assert(stream < 4);
emit_instruction(new EmitVertex(stream, cut));
if (!cut)
emit_instruction(new AluInstruction(op2_add_int, m_export_base, m_export_base,
PValue(new LiteralValue(sh_info().noutput)),
{alu_write, alu_last_instr}));
return true;
}
bool GeometryShaderFromNir::emit_load_from_array(nir_intrinsic_instr* instr,
const ArrayDeref& array_deref)
{
auto dest = vec_from_nir(instr->dest, instr->num_components);
const nir_load_const_instr* literal_index = nullptr;
if (array_deref.index->is_ssa)
literal_index = get_literal_constant(array_deref.index->ssa->index);
if (!literal_index) {
sfn_log << SfnLog::err << "GS: Indirect input addressing not (yet) supported\n";
return false;
}
assert(literal_index->value[0].u32 < 6);
PValue addr = m_per_vertex_offsets[literal_index->value[0].u32];
auto fetch = new FetchInstruction(vc_fetch, no_index_offset, dest, addr,
16 * array_deref.var->data.driver_location,
R600_GS_RING_CONST_BUFFER, PValue(), bim_none, true);
emit_instruction(fetch);
return true;
}
void GeometryShaderFromNir::do_finalize()
{
if (m_num_clip_dist) {
sh_info().cc_dist_mask = (1 << m_num_clip_dist) - 1;
sh_info().clip_dist_write = (1 << m_num_clip_dist) - 1;
}
}
}