blob: 6715d373e3315070e4490ef00e9a3c2b9f800caf [file] [log] [blame]
/*
* Copyright © 2024 Valve Corporation
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
#include "gl_nir_linker.h"
#include "linker_util.h"
#include "program/symbol_table.h"
#include "util/hash_table.h"
#include "main/shader_types.h"
struct function_sig {
nir_function *func;
struct list_head node;
};
typedef enum {
PARAMETER_LIST_NO_MATCH,
PARAMETER_LIST_EXACT_MATCH,
PARAMETER_LIST_INEXACT_MATCH /* Match requires implicit conversion. */
} parameter_list_match_t;
/**
* Check if two parameter lists match.
*
* list_a Parameters of the function definition.
* list_b Actual parameters passed to the function.
*/
static parameter_list_match_t
parameter_lists_match(bool has_implicit_conversions,
bool has_implicit_int_to_uint_conversion,
nir_parameter *list_a, unsigned num_params_a,
nir_parameter *list_b, unsigned num_params_b)
{
/* The lists have different length and by definition do not match. */
if (num_params_a != num_params_b)
return PARAMETER_LIST_NO_MATCH;
nir_parameter *param_a;
nir_parameter *param_b;
/* This is set to true if there is an inexact match requiring an implicit
* conversion. */
bool inexact_match = false;
for (int i = 0; i < num_params_a; i++) {
param_a = &list_a[i];
param_b = &list_b[i];
if (param_a->type == param_b->type)
continue;
/* Try to find an implicit conversion from actual to param. */
inexact_match = true;
switch (param_a->mode) {
case nir_var_function_in:
if (param_a->implicit_conversion_prohibited ||
!_mesa_glsl_can_implicitly_convert(param_b->type, param_a->type,
has_implicit_conversions,
has_implicit_int_to_uint_conversion))
return PARAMETER_LIST_NO_MATCH;
break;
case nir_var_function_out:
if (!_mesa_glsl_can_implicitly_convert(param_a->type, param_b->type,
has_implicit_conversions,
has_implicit_int_to_uint_conversion))
return PARAMETER_LIST_NO_MATCH;
break;
case nir_var_function_inout:
/* Since there are no bi-directional automatic conversions (e.g.,
* there is int -> float but no float -> int), inout parameters must
* be exact matches.
*/
return PARAMETER_LIST_NO_MATCH;
default:
assert(false);
return PARAMETER_LIST_NO_MATCH;
}
}
if (inexact_match)
return PARAMETER_LIST_INEXACT_MATCH;
else
return PARAMETER_LIST_EXACT_MATCH;
}
/* Classes of parameter match, sorted (mostly) best matches first.
* See is_better_parameter_match() below for the exceptions.
* */
typedef enum {
PARAMETER_EXACT_MATCH,
PARAMETER_FLOAT_TO_DOUBLE,
PARAMETER_INT_TO_FLOAT,
PARAMETER_INT_TO_DOUBLE,
PARAMETER_OTHER_CONVERSION,
} parameter_match_t;
static parameter_match_t
get_parameter_match_type(const nir_parameter *param,
const nir_parameter *actual)
{
const struct glsl_type *from_type;
const struct glsl_type *to_type;
if (param->mode == nir_var_function_out) {
from_type = param->type;
to_type = actual->type;
} else {
from_type = actual->type;
to_type = param->type;
}
if (from_type == to_type)
return PARAMETER_EXACT_MATCH;
if (glsl_type_is_double(to_type)) {
if (glsl_type_is_float(from_type))
return PARAMETER_FLOAT_TO_DOUBLE;
return PARAMETER_INT_TO_DOUBLE;
}
if (glsl_type_is_float(to_type))
return PARAMETER_INT_TO_FLOAT;
/* int -> uint and any other oddball conversions */
return PARAMETER_OTHER_CONVERSION;
}
/* From section 6.1 of the GLSL 4.00 spec (and the ARB_gpu_shader5 spec):
*
* 1. An exact match is better than a match involving any implicit
* conversion.
*
* 2. A match involving an implicit conversion from float to double
* is better than match involving any other implicit conversion.
*
* [XXX: Not in GLSL 4.0: Only in ARB_gpu_shader5:
* 3. A match involving an implicit conversion from either int or uint
* to float is better than a match involving an implicit conversion
* from either int or uint to double.]
*
* If none of the rules above apply to a particular pair of conversions,
* neither conversion is considered better than the other.
*
* --
*
* Notably, the int->uint conversion is *not* considered to be better
* or worse than int/uint->float or int/uint->double.
*/
static bool
is_better_parameter_match(parameter_match_t a_match,
parameter_match_t b_match)
{
if (a_match >= PARAMETER_INT_TO_FLOAT && b_match == PARAMETER_OTHER_CONVERSION)
return false;
return a_match < b_match;
}
/* From section 6.1 of the GLSL 4.00 spec (and the ARB_gpu_shader5 spec):
*
* "A function definition A is considered a better
* match than function definition B if:
*
* * for at least one function argument, the conversion for that argument
* in A is better than the corresponding conversion in B; and
*
* * there is no function argument for which the conversion in B is better
* than the corresponding conversion in A.
*
* If a single function definition is considered a better match than every
* other matching function definition, it will be used. Otherwise, a
* semantic error occurs and the shader will fail to compile."
*/
static bool
is_best_inexact_overload(nir_parameter *actual_parameters,
unsigned num_parameters,
nir_function **matches, int num_matches,
nir_function *sig)
{
for (nir_function **other = matches; other < matches + num_matches; other++) {
if (*other == sig)
continue;
nir_parameter *node_a = sig->params;
nir_parameter *node_b = (*other)->params;
bool better_for_some_parameter = false;
for (unsigned i = 0; i < num_parameters; i++) {
parameter_match_t a_match =
get_parameter_match_type(&node_a[i], &actual_parameters[i]);
parameter_match_t b_match =
get_parameter_match_type(&node_b[i], &actual_parameters[i]);
if (is_better_parameter_match(a_match, b_match))
better_for_some_parameter = true;
if (is_better_parameter_match(b_match, a_match))
return false; /* B is better for this parameter */
}
if (!better_for_some_parameter)
return false; /* A must be better than B for some parameter */
}
return true;
}
static nir_function *
choose_best_inexact_overload(nir_parameter *actual_parameters,
unsigned num_parameters,
nir_function **matches, int num_matches,
bool has_choose_best_inexact_overload)
{
if (num_matches == 0)
return NULL;
if (num_matches == 1)
return *matches;
if (!has_choose_best_inexact_overload)
return NULL;
for (nir_function **sig = matches; sig < matches + num_matches; sig++) {
if (is_best_inexact_overload(actual_parameters, num_parameters,
matches, num_matches, *sig))
return *sig;
}
/* no best candidate */
return NULL;
}
static nir_function *
find_matching_signature(struct list_head *f_list,
nir_parameter *parameters,
unsigned num_parameters,
bool has_implicit_conversions,
bool has_implicit_int_to_uint_conversion)
{
nir_function **inexact_matches = NULL;
nir_function **inexact_matches_temp;
nir_function *match = NULL;
int num_inexact_matches = 0;
/* From page 42 (page 49 of the PDF) of the GLSL 1.20 spec:
*
* "If an exact match is found, the other signatures are ignored, and
* the exact match is used. Otherwise, if no exact match is found, then
* the implicit conversions in Section 4.1.10 "Implicit Conversions" will
* be applied to the calling arguments if this can make their types match
* a signature. In this case, it is a semantic error if there are
* multiple ways to apply these conversions to the actual arguments of a
* call such that the call can be made to match multiple signatures."
*/
list_for_each_entry(struct function_sig, sig, f_list, node) {
switch (parameter_lists_match(has_implicit_conversions,
has_implicit_int_to_uint_conversion,
sig->func->params, sig->func->num_params,
parameters, num_parameters)) {
case PARAMETER_LIST_EXACT_MATCH:
free(inexact_matches);
return sig->func;
case PARAMETER_LIST_INEXACT_MATCH:
/* Subroutine signatures must match exactly */
if (sig->func->is_subroutine)
continue;
inexact_matches_temp = (nir_function **)
realloc(inexact_matches,
sizeof(*inexact_matches) *
(num_inexact_matches + 1));
inexact_matches = inexact_matches_temp;
inexact_matches[num_inexact_matches++] = sig->func;
continue;
case PARAMETER_LIST_NO_MATCH:
continue;
default:
assert(false);
return NULL;
}
}
match = choose_best_inexact_overload(parameters, num_parameters,
inexact_matches, num_inexact_matches,
has_implicit_int_to_uint_conversion);
free(inexact_matches);
return match;
}
static nir_function *
clone_function(struct hash_table *remap_table,
const nir_function *fxn, nir_shader *ns)
{
nir_function *nfxn = nir_function_clone(ns, fxn);
/* Needed for call instructions */
_mesa_hash_table_insert(remap_table, fxn, nfxn);
return nfxn;
}
bool
gl_nir_link_function_calls(struct gl_shader_program *prog,
struct gl_shader *main,
struct gl_linked_shader *linked_sh,
struct gl_shader **shader_list,
unsigned num_shaders)
{
void *mem_ctx = ralloc_context(NULL);
struct hash_table *var_lookup = _mesa_string_hash_table_create(mem_ctx);
struct hash_table *func_lookup = _mesa_string_hash_table_create(mem_ctx);
struct hash_table *remap_table = _mesa_pointer_hash_table_create(mem_ctx);
nir_foreach_variable_in_shader(var, linked_sh->Program->nir) {
_mesa_hash_table_insert(var_lookup, var->name, var);
}
nir_foreach_function(func, linked_sh->Program->nir) {
if (!func->impl)
continue;
struct hash_entry *e = _mesa_hash_table_search(func_lookup, func->name);
if (e) {
struct list_head *f_list = (struct list_head *) e->data;
nir_function *f = find_matching_signature(f_list, func->params,
func->num_params,
main->has_implicit_conversions,
main->has_implicit_int_to_uint_conversion);
if (!f) {
struct function_sig *func_sig = ralloc(mem_ctx, struct function_sig);
func_sig->func = func;
list_add(&func_sig->node, f_list);
}
} else {
struct list_head *func_list = ralloc(mem_ctx, struct list_head);
list_inithead(func_list);
struct function_sig *func_sig = ralloc(mem_ctx, struct function_sig);
func_sig->func = func;
list_add(&func_sig->node, func_list);
_mesa_hash_table_insert(func_lookup, func->name, func_list);
}
}
for (unsigned i = 0; i < num_shaders; i++) {
/* Skip shader object with main function as we have already cloned the
* full shader.
*/
if (main == shader_list[i])
continue;
/* Before cloning the shader check the lookup table to see if globals
* have already been seen in a previous shader, if so update the remap
* table.
*/
nir_foreach_variable_in_shader(var, shader_list[i]->nir) {
struct hash_entry *e =
_mesa_hash_table_search(var_lookup, var->name);
if (e) {
_mesa_hash_table_insert(remap_table, var, e->data);
nir_variable *m_var = (nir_variable *) e->data;
if (glsl_type_is_array(var->type)) {
/* It is possible to have a global array declared in multiple
* shaders without a size. The array is implicitly sized by
* the maximal access to it in *any* shader. Because of this,
* we need to track the maximal access to the array as linking
* pulls more functions in that access the array.
*/
m_var->data.max_array_access =
MAX2(var->data.max_array_access,
m_var->data.max_array_access);
if (glsl_array_size(m_var->type) == 0 &&
glsl_array_size(var->type) != 0)
m_var->type = var->type;
}
if (glsl_without_array(var->type) == var->interface_type) {
/* Similarly, we need implicit sizes of arrays within interface
* blocks to be sized by the maximal access in *any* shader.
*/
int *linked_max_ifc_array_access = m_var->max_ifc_array_access;
int *ir_max_ifc_array_access = var->max_ifc_array_access;
assert(linked_max_ifc_array_access != NULL);
assert(ir_max_ifc_array_access != NULL);
for (unsigned j = 0; j < var->interface_type->length; j++) {
linked_max_ifc_array_access[j] =
MAX2(linked_max_ifc_array_access[j],
ir_max_ifc_array_access[j]);
}
}
} else {
nir_variable *nvar =
nir_variable_clone(var, linked_sh->Program->nir);
_mesa_hash_table_insert(remap_table, var, nvar);
nir_shader_add_variable(linked_sh->Program->nir, nvar);
_mesa_hash_table_insert(var_lookup, var->name, nvar);
}
}
/* Clone functions into our combined shader */
nir_foreach_function(func, shader_list[i]->nir) {
nir_function *f = NULL;
/* Try to find the signature in one of the shaders that is being
* linked. If not found clone the function.
*/
struct hash_entry *e = _mesa_hash_table_search(func_lookup, func->name);
if (e) {
struct list_head *f_list = (struct list_head *) e->data;
f = find_matching_signature(f_list, func->params,
func->num_params,
false,
false);
if (!f) {
struct function_sig *func_sig = ralloc(mem_ctx, struct function_sig);
f = clone_function(remap_table, func, linked_sh->Program->nir);
func_sig->func = f;
if (func->impl)
list_add(&func_sig->node, f_list);
} else {
_mesa_hash_table_insert(remap_table, func, f);
}
} else {
struct list_head *func_list = ralloc(mem_ctx, struct list_head);
list_inithead(func_list);
struct function_sig *func_sig = ralloc(mem_ctx, struct function_sig);
f = clone_function(remap_table, func, linked_sh->Program->nir);
func_sig->func = f;
if (func->impl)
list_add(&func_sig->node, func_list);
_mesa_hash_table_insert(func_lookup, func->name, func_list);
}
}
/* Now that all functions are cloned we can clone any function
* implementations. We can't do this in the previous loop above because
* glsl to nir places function declarations next to implementations i.e.
* we have lost any predeclared function signatures so we won't always
* find them in the remap table until they have all been processed.
*/
nir_foreach_function(func, shader_list[i]->nir) {
if (func->impl) {
nir_function_impl *f_impl =
nir_function_impl_clone_remap_globals(linked_sh->Program->nir,
func->impl, remap_table);
struct hash_entry *e =
_mesa_hash_table_search(remap_table, func);
assert(e);
nir_function *f = (nir_function *) e->data;
assert(!f->impl);
nir_function_set_impl(f, f_impl);
}
}
}
/* Now that all shaders have been combined together make sure all function
* calls can be resolved.
*/
nir_foreach_function_impl(impl, linked_sh->Program->nir) {
nir_foreach_block(block, impl) {
nir_foreach_instr(instr, block) {
if (instr->type == nir_instr_type_call) {
nir_call_instr *call = nir_instr_as_call(instr);
/* If this was already set at compile time don't try to set it
* again.
*/
if (call->callee->impl)
continue;
struct hash_entry *e = _mesa_hash_table_search(func_lookup,
call->callee->name);
if (e) {
struct list_head *f_list = (struct list_head *) e->data;
nir_function *f =
find_matching_signature(f_list, call->callee->params,
call->callee->num_params,
main->has_implicit_conversions,
main->has_implicit_int_to_uint_conversion);
if (f)
call->callee = f;
}
if (!call->callee->impl) {
linker_error(prog, "unresolved reference to function `%s'\n",
call->callee->name);
ralloc_free(mem_ctx);
return false;
}
}
}
}
}
/**
* Link all out variables on a single stage which are not
* directly used in a shader with the main function.
*/
if (linked_sh->Stage != MESA_SHADER_FRAGMENT) {
for (unsigned i = 0; i < num_shaders; i++) {
/* Skip shader object with main function as we have already cloned
* the full shader, including shader outputs.
*/
if (main == shader_list[i])
continue;
nir_foreach_shader_out_variable(var, shader_list[i]->nir) {
struct hash_entry *e =
_mesa_hash_table_search(var_lookup, var->name);
if (e)
continue;
nir_variable *nvar = nir_variable_clone(var, linked_sh->Program->nir);
nir_shader_add_variable(linked_sh->Program->nir, nvar);
_mesa_hash_table_insert(var_lookup, var->name, var);
}
}
}
/* Call fixup deref types as we may have set array sizes above */
nir_fixup_deref_types(linked_sh->Program->nir);
ralloc_free(mem_ctx);
return true;
}