blob: 37921935b4ad452a2fe624a3a471d512bfe7de9e [file] [log] [blame]
/*
* Copyright (C) 2022 Collabora, Ltd.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*/
#include "bi_builder.h"
#include "bi_test.h"
#include "va_compiler.h"
#include "valhall_enums.h"
#include <gtest/gtest.h>
/*
 * Remove every instruction whose opcode is BI_OPCODE_NOP from the shader.
 *
 * The "_safe" iterator variant is used because instructions are removed
 * while the list is being walked.
 */
static void
strip_nops(bi_context *ctx)
{
   bi_foreach_instr_global_safe(ctx, instr) {
      /* Anything that is not a NOP is kept untouched. */
      if (instr->op != BI_OPCODE_NOP)
         continue;

      bi_remove_instruction(instr);
   }
}
/*
 * Test harness for va_insert_flow_control_nops().
 *
 * Two builders, A and B, are allocated from the fixture's `mem_ctx`, and the
 * `test` body is expanded once for each with `b` bound to that builder and
 * the shader stage set to MESA_SHADER_<shader_stage>.
 *
 * Shader A then has all of its NOPs stripped and is run through
 * va_insert_flow_control_nops(); shader B is left exactly as written. The
 * case passes when the two shaders compare equal. The `test` body is
 * therefore written as the *expected output* of the pass, including the
 * flow-control NOPs it should insert.
 *
 * Because `test` is expanded twice, it must not rely on state shared between
 * the two expansions. `b` is marked UNUSED so an empty body does not warn.
 */
#define CASE(shader_stage, test) \
do { \
bi_builder *A = bit_builder(mem_ctx); \
bi_builder *B = bit_builder(mem_ctx); \
{ \
UNUSED bi_builder *b = A; \
A->shader->stage = MESA_SHADER_##shader_stage; \
test; \
} \
strip_nops(A->shader); \
va_insert_flow_control_nops(A->shader); \
{ \
UNUSED bi_builder *b = B; \
B->shader->stage = MESA_SHADER_##shader_stage; \
test; \
} \
ASSERT_SHADER_EQUAL(A->shader, B->shader); \
} while (0)
/*
 * Call bi_nop() on the in-scope builder `b` and set the `flow` field of the
 * returned instruction to VA_FLOW_<f>. The expansion is parenthesized so it
 * stays a single expression wherever it is used.
 */
#define flow(f) (bi_nop(b)->flow = VA_FLOW_##f)
/*
 * Test fixture that owns a ralloc context for the duration of a test. The
 * CASE macro allocates its builders from `mem_ctx`; the context is released
 * when the fixture is destroyed.
 */
class InsertFlow : public testing::Test {
 protected:
   /* Create a fresh root context (no parent) for this test. */
   InsertFlow() : mem_ctx(ralloc_context(NULL))
   {
   }

   /* Release the context created by the constructor. */
   ~InsertFlow()
   {
      ralloc_free(mem_ctx);
   }

   /* ralloc context handed to bit_builder() by the CASE macro. */
   void *mem_ctx;
};
/*
 * An empty fragment shader must come out of va_insert_flow_control_nops()
 * still equal to an empty shader: the expected body contains no instructions
 * and no flow NOPs.
 */
TEST_F(InsertFlow, PreserveEmptyShader)
{
CASE(FRAGMENT, {});
}
/*
 * Three fragment shaders that each run an fadd followed by one of BLEND,
 * ST_TILE or LD_TILE. In every case the expected output has a DISCARD flow
 * NOP first, a WAIT flow NOP right before the tile/blend instruction, and an
 * END flow NOP last.
 */
TEST_F(InsertFlow, TilebufferWait7)
{
   /* BLEND */
   CASE(FRAGMENT, {
      const auto r0 = bi_register(0);

      flow(DISCARD);
      bi_fadd_f32_to(b, r0, r0, r0);

      flow(WAIT);
      bi_blend_to(b, r0, bi_register(4), bi_register(5), bi_register(6),
                  bi_register(7), bi_register(8), BI_REGISTER_FORMAT_AUTO, 4,
                  4);

      flow(END);
   });

   /* ST_TILE */
   CASE(FRAGMENT, {
      const auto r0 = bi_register(0);

      flow(DISCARD);
      bi_fadd_f32_to(b, r0, r0, r0);

      flow(WAIT);
      bi_st_tile(b, r0, bi_register(4), bi_register(5), bi_register(6),
                 BI_REGISTER_FORMAT_AUTO, BI_VECSIZE_V4);

      flow(END);
   });

   /* LD_TILE */
   CASE(FRAGMENT, {
      const auto r0 = bi_register(0);

      flow(DISCARD);
      bi_fadd_f32_to(b, r0, r0, r0);

      flow(WAIT);
      bi_ld_tile_to(b, r0, bi_register(4), bi_register(5), bi_register(6),
                    BI_REGISTER_FORMAT_AUTO, BI_VECSIZE_V4);

      flow(END);
   });
}
/*
 * Fragment shader with an fadd followed by ATEST. The expected output has a
 * WAIT0126 flow NOP right before the ATEST and a WAIT0 flow NOP right after
 * it, bracketed by DISCARD at the start and END at the end.
 */
TEST_F(InsertFlow, AtestWait6AndWait0After)
{
   CASE(FRAGMENT, {
      const auto r0 = bi_register(0);

      flow(DISCARD);
      bi_fadd_f32_to(b, r0, r0, r0);

      flow(WAIT0126);
      bi_atest_to(b, r0, bi_register(4), bi_register(5),
                  bi_fau(BIR_FAU_ATEST_PARAM, false));
      flow(WAIT0);

      flow(END);
   });
}
/*
 * Fragment shader with an fadd followed by ZS_EMIT. The expected output has
 * a WAIT0126 flow NOP right before the ZS_EMIT, with DISCARD at the start
 * and END at the end.
 */
TEST_F(InsertFlow, ZSEmitWait6)
{
   CASE(FRAGMENT, {
      const auto r0 = bi_register(0);

      flow(DISCARD);
      bi_fadd_f32_to(b, r0, r0, r0);

      flow(WAIT0126);
      bi_zs_emit_to(b, r0, bi_register(4), bi_register(5), bi_register(6),
                    true, true);

      flow(END);
   });
}
/*
 * Vertex shader: an attribute load into r16 (V4), an fadd that touches only
 * r0, then an fadd that reads r19. The expected output has no flow NOP
 * before the first fadd and a WAIT0 flow NOP before the second one.
 *
 * NOTE(review): presumably r19 is the last register written by the V4 load
 * at r16, which is why only the second fadd needs the wait -- confirm.
 */
TEST_F(InsertFlow, LoadThenUnrelatedThenUse)
{
   CASE(VERTEX, {
      const auto r0 = bi_register(0);

      bi_ld_attr_imm_to(b, bi_register(16), bi_register(60), bi_register(61),
                        BI_REGISTER_FORMAT_F32, BI_VECSIZE_V4, 1);

      /* Does not read the load destination. */
      bi_fadd_f32_to(b, r0, r0, r0);

      flow(WAIT0);
      bi_fadd_f32_to(b, r0, r0, bi_register(19));

      flow(END);
   });
}
/*
 * Fragment shader consisting of a single LD_VAR_BUF_IMM.f16 with
 * BI_UPDATE_RETRIEVE. The expected output has DISCARD first, then the load,
 * then a WAIT0 flow NOP followed by the END flow NOP.
 */
TEST_F(InsertFlow, SingleLdVar)
{
   CASE(FRAGMENT, {
      const auto dest = bi_register(2);
      const auto src = bi_register(61);

      flow(DISCARD);

      bi_ld_var_buf_imm_f16_to(b, dest, src, BI_REGISTER_FORMAT_F16,
                               BI_SAMPLE_CENTER, BI_SOURCE_FORMAT_F16,
                               BI_UPDATE_RETRIEVE, BI_VECSIZE_V4, 0);

      flow(WAIT0);
      flow(END);
   });
}
/*
 * Fragment shader with three LD_VAR_BUF_IMM.f16 instructions: a STORE and a
 * RETRIEVE of index 0, then a STORE of index 1. The expected output has a
 * WAIT0 flow NOP between the second and third loads, and another WAIT0
 * before END.
 */
TEST_F(InsertFlow, SerializeLdVars)
{
   CASE(FRAGMENT, {
      const auto r61 = bi_register(61);

      flow(DISCARD);

      bi_ld_var_buf_imm_f16_to(b, bi_register(16), r61,
                               BI_REGISTER_FORMAT_F16, BI_SAMPLE_CENTER,
                               BI_SOURCE_FORMAT_F16, BI_UPDATE_STORE,
                               BI_VECSIZE_V4, 0);

      bi_ld_var_buf_imm_f16_to(b, bi_register(2), r61,
                               BI_REGISTER_FORMAT_F16, BI_SAMPLE_CENTER,
                               BI_SOURCE_FORMAT_F16, BI_UPDATE_RETRIEVE,
                               BI_VECSIZE_V4, 0);

      /* Expected wait before the next load is issued. */
      flow(WAIT0);

      bi_ld_var_buf_imm_f16_to(b, bi_register(8), r61,
                               BI_REGISTER_FORMAT_F16, BI_SAMPLE_CENTER,
                               BI_SOURCE_FORMAT_F16, BI_UPDATE_STORE,
                               BI_VECSIZE_V4, 1);

      flow(WAIT0);
      flow(END);
   });
}
/*
 * Fragment shader: fadd, CLPER, fadd. The expected output places the DISCARD
 * flow NOP after the CLPER rather than at the start of the shader, and END
 * after the final fadd.
 */
TEST_F(InsertFlow, Clper)
{
   CASE(FRAGMENT, {
      const auto r0 = bi_register(0);

      bi_fadd_f32_to(b, r0, r0, r0);

      bi_clper_i32_to(b, r0, bi_register(4), bi_register(8),
                      BI_INACTIVE_RESULT_ZERO, BI_LANE_OP_NONE,
                      BI_SUBGROUP_SUBGROUP4);

      /* Expected only once the CLPER has been issued. */
      flow(DISCARD);

      bi_fadd_f32_to(b, r0, r0, r0);

      flow(END);
   });
}
/*
 * Fragment shader: fadd, TEX_SINGLE with BI_VA_LOD_MODE_COMPUTED_LOD, fadd.
 * The expected output places DISCARD and then WAIT0 flow NOPs after the
 * texture instruction, and END after the final fadd.
 *
 * NOTE(review): presumably DISCARD is delayed because a computed LOD depends
 * on helper invocations -- confirm against the pass.
 */
TEST_F(InsertFlow, TextureImplicit)
{
   CASE(FRAGMENT, {
      const auto r0 = bi_register(0);

      bi_fadd_f32_to(b, r0, r0, r0);

      bi_tex_single_to(b, r0, bi_register(4), bi_register(8),
                       bi_register(12), false, BI_DIMENSION_2D,
                       BI_REGISTER_FORMAT_F32, false, false,
                       BI_VA_LOD_MODE_COMPUTED_LOD, false, BI_WRITE_MASK_RGBA,
                       4);

      flow(DISCARD);
      flow(WAIT0);

      bi_fadd_f32_to(b, r0, r0, r0);

      flow(END);
   });
}
/*
 * Fragment shader: fadd, TEX_SINGLE with BI_VA_LOD_MODE_ZERO_LOD, fadd. The
 * expected output has DISCARD at the very start, a WAIT0 flow NOP after the
 * texture instruction, and END after the final fadd.
 */
TEST_F(InsertFlow, TextureExplicit)
{
   CASE(FRAGMENT, {
      const auto r0 = bi_register(0);

      flow(DISCARD);

      bi_fadd_f32_to(b, r0, r0, r0);

      bi_tex_single_to(b, r0, bi_register(4), bi_register(8),
                       bi_register(12), false, BI_DIMENSION_2D,
                       BI_REGISTER_FORMAT_F32, false, false,
                       BI_VA_LOD_MODE_ZERO_LOD, false, BI_WRITE_MASK_RGBA, 4);

      flow(WAIT0);

      bi_fadd_f32_to(b, r0, r0, r0);

      flow(END);
   });
}
/*
 * Control flow graph built by this test:
 *
 *      A
 *     / \
 *    B   C
 *     \ /
 *      D
 *
 * A is the shader's start block; B, C and D are created with bit_block().
 * Only B and C receive instructions besides the final END in D.
 */
TEST_F(InsertFlow, DiamondCFG)
{
CASE(FRAGMENT, {
/* These locals shadow the CASE macro's builders A and B inside this
 * body only; the builder in use is reached through `b`. */
bi_block *A = bi_start_block(&b->shader->blocks);
bi_block *B = bit_block(b->shader);
bi_block *C = bit_block(b->shader);
bi_block *D = bit_block(b->shader);
/* Wire up the diamond: A branches to B and C, both of which join at D. */
bi_block_add_successor(A, B);
bi_block_add_successor(A, C);
bi_block_add_successor(B, D);
bi_block_add_successor(C, D);
/* B uses helper invocations, no other block does.
*
* That means B and C need to discard helpers.
*/
/* Block B: DISCARD is expected after the CLPER, then RECONVERGE. */
b->cursor = bi_after_block(B);
bi_clper_i32_to(b, bi_register(0), bi_register(4), bi_register(8),
BI_INACTIVE_RESULT_ZERO, BI_LANE_OP_NONE,
BI_SUBGROUP_SUBGROUP4);
flow(DISCARD);
flow(RECONVERGE);
/* Block C: DISCARD is expected at the top, then RECONVERGE at the end. */
b->cursor = bi_after_block(C);
flow(DISCARD);
bi_fadd_f32_to(b, bi_register(0), bi_register(0), bi_register(0));
flow(RECONVERGE);
/* Block D: only the END flow NOP is expected. */
b->cursor = bi_after_block(D);
flow(END);
});
}
/*
 * Kernel shader: a STORE.i32 forced onto slot 2, an fadd on unrelated
 * registers, then a BARRIER. The expected output has a WAIT2 flow NOP before
 * the barrier and a WAIT flow NOP after it, followed by END.
 */
TEST_F(InsertFlow, BarrierBug)
{
   CASE(KERNEL, {
      const auto r10 = bi_register(10);

      bi_instr *store = bi_store_i32(b, bi_register(0), bi_register(2),
                                     bi_register(4), BI_SEG_NONE, 0);
      store->slot = 2;

      bi_fadd_f32_to(b, r10, r10, r10);

      flow(WAIT2);
      bi_barrier(b);
      flow(WAIT);

      flow(END);
   });
}