| /* |
| * Copyright © Microsoft Corporation |
| * |
| * Permission is hereby granted, free of charge, to any person obtaining a |
| * copy of this software and associated documentation files (the "Software"), |
| * to deal in the Software without restriction, including without limitation |
| * the rights to use, copy, modify, merge, publish, distribute, sublicense, |
| * and/or sell copies of the Software, and to permit persons to whom the |
| * Software is furnished to do so, subject to the following conditions: |
| * |
| * The above copyright notice and this permission notice (including the next |
| * paragraph) shall be included in all copies or substantial portions of the |
| * Software. |
| * |
| * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
| * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
| * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING |
| * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS |
| * IN THE SOFTWARE. |
| */ |
| |
| #include "nir/nir.h" |
| #include "nir/nir_serialize.h" |
| #include "glsl_types.h" |
| #include "nir_types.h" |
| #include "clc.h" |
| #include "clc_helpers.h" |
| #include "spirv/nir_spirv.h" |
| #include "util/u_debug.h" |
| |
| #include <stdlib.h> |
| |
| enum clc_debug_flags { |
| CLC_DEBUG_DUMP_SPIRV = 1 << 0, |
| CLC_DEBUG_VERBOSE = 1 << 1, |
| }; |
| |
| static const struct debug_named_value clc_debug_options[] = { |
| { "dump_spirv", CLC_DEBUG_DUMP_SPIRV, "Dump spirv blobs" }, |
| { "verbose", CLC_DEBUG_VERBOSE, NULL }, |
| DEBUG_NAMED_VALUE_END |
| }; |
| |
| DEBUG_GET_ONCE_FLAGS_OPTION(debug_clc, "CLC_DEBUG", clc_debug_options, 0) |
| |
| static void |
| clc_print_kernels_info(const struct clc_parsed_spirv *obj) |
| { |
| fprintf(stdout, "Kernels:\n"); |
| for (unsigned i = 0; i < obj->num_kernels; i++) { |
| const struct clc_kernel_arg *args = obj->kernels[i].args; |
| bool first = true; |
| |
| fprintf(stdout, "\tvoid %s(", obj->kernels[i].name); |
| for (unsigned j = 0; j < obj->kernels[i].num_args; j++) { |
| if (!first) |
| fprintf(stdout, ", "); |
| else |
| first = false; |
| |
| switch (args[j].address_qualifier) { |
| case CLC_KERNEL_ARG_ADDRESS_GLOBAL: |
| fprintf(stdout, "__global "); |
| break; |
| case CLC_KERNEL_ARG_ADDRESS_LOCAL: |
| fprintf(stdout, "__local "); |
| break; |
| case CLC_KERNEL_ARG_ADDRESS_CONSTANT: |
| fprintf(stdout, "__constant "); |
| break; |
| default: |
| break; |
| } |
| |
| if (args[j].type_qualifier & CLC_KERNEL_ARG_TYPE_VOLATILE) |
| fprintf(stdout, "volatile "); |
| if (args[j].type_qualifier & CLC_KERNEL_ARG_TYPE_CONST) |
| fprintf(stdout, "const "); |
| if (args[j].type_qualifier & CLC_KERNEL_ARG_TYPE_RESTRICT) |
| fprintf(stdout, "restrict "); |
| |
| fprintf(stdout, "%s %s", args[j].type_name, args[j].name); |
| } |
| fprintf(stdout, ");\n"); |
| } |
| } |
| |
| static void |
| clc_libclc_optimize(nir_shader *s) |
| { |
| bool progress; |
| do { |
| progress = false; |
| NIR_PASS(progress, s, nir_split_var_copies); |
| NIR_PASS(progress, s, nir_opt_copy_prop_vars); |
| NIR_PASS(progress, s, nir_lower_var_copies); |
| NIR_PASS(progress, s, nir_lower_vars_to_ssa); |
| NIR_PASS(progress, s, nir_copy_prop); |
| NIR_PASS(progress, s, nir_opt_remove_phis); |
| NIR_PASS(progress, s, nir_opt_dce); |
| NIR_PASS(progress, s, nir_opt_if, nir_opt_if_aggressive_last_continue | nir_opt_if_optimize_phi_true_false); |
| NIR_PASS(progress, s, nir_opt_dead_cf); |
| NIR_PASS(progress, s, nir_opt_cse); |
| NIR_PASS(progress, s, nir_opt_peephole_select, 8, true, true); |
| NIR_PASS(progress, s, nir_opt_algebraic); |
| NIR_PASS(progress, s, nir_opt_constant_folding); |
| NIR_PASS(progress, s, nir_opt_undef); |
| NIR_PASS(progress, s, nir_lower_undef_to_zero); |
| NIR_PASS(progress, s, nir_opt_deref); |
| } while (progress); |
| } |
| |
| struct clc_libclc { |
| const nir_shader *libclc_nir; |
| }; |
| |
| struct clc_libclc * |
| clc_libclc_new(const struct clc_logger *logger, const struct clc_libclc_options *options) |
| { |
| struct clc_libclc *ctx = rzalloc(NULL, struct clc_libclc); |
| if (!ctx) { |
| clc_error(logger, "D3D12: failed to allocate a clc_libclc"); |
| return NULL; |
| } |
| |
| const struct spirv_to_nir_options libclc_spirv_options = { |
| .environment = NIR_SPIRV_OPENCL, |
| .create_library = true, |
| .constant_addr_format = nir_address_format_32bit_index_offset_pack64, |
| .global_addr_format = nir_address_format_32bit_index_offset_pack64, |
| .shared_addr_format = nir_address_format_32bit_offset_as_64bit, |
| .temp_addr_format = nir_address_format_32bit_offset_as_64bit, |
| .float_controls_execution_mode = FLOAT_CONTROLS_DENORM_FLUSH_TO_ZERO_FP32, |
| .caps = { |
| .address = true, |
| .float64 = true, |
| .int8 = true, |
| .int16 = true, |
| .int64 = true, |
| .kernel = true, |
| }, |
| }; |
| |
| glsl_type_singleton_init_or_ref(); |
| nir_shader *s = nir_load_libclc_shader(64, NULL, &libclc_spirv_options, options->nir_options); |
| if (!s) { |
| clc_error(logger, "D3D12: spirv_to_nir failed on libclc blob"); |
| ralloc_free(ctx); |
| return NULL; |
| } |
| |
| if (options && options->optimize) |
| clc_libclc_optimize(s); |
| |
| ralloc_steal(ctx, s); |
| ctx->libclc_nir = s; |
| |
| return ctx; |
| } |
| |
| void clc_free_libclc(struct clc_libclc *ctx) |
| { |
| ralloc_free(ctx); |
| glsl_type_singleton_decref(); |
| } |
| |
| const nir_shader *clc_libclc_get_clc_shader(struct clc_libclc *ctx) |
| { |
| return ctx->libclc_nir; |
| } |
| |
| void clc_libclc_serialize(struct clc_libclc *context, |
| void **serialized, |
| size_t *serialized_size) |
| { |
| struct blob tmp; |
| blob_init(&tmp); |
| nir_serialize(&tmp, context->libclc_nir, true); |
| |
| blob_finish_get_buffer(&tmp, serialized, serialized_size); |
| } |
| |
| void clc_libclc_free_serialized(void *serialized) |
| { |
| free(serialized); |
| } |
| |
| struct clc_libclc * |
| clc_libclc_deserialize(const void *serialized, size_t serialized_size) |
| { |
| struct clc_libclc *ctx = rzalloc(NULL, struct clc_libclc); |
| if (!ctx) { |
| return NULL; |
| } |
| |
| glsl_type_singleton_init_or_ref(); |
| |
| struct blob_reader tmp; |
| blob_reader_init(&tmp, serialized, serialized_size); |
| |
| nir_shader *s = nir_deserialize(NULL, NULL, &tmp); |
| if (!s) { |
| ralloc_free(ctx); |
| return NULL; |
| } |
| |
| ralloc_steal(ctx, s); |
| ctx->libclc_nir = s; |
| |
| return ctx; |
| } |
| |
| bool |
| clc_compile_c_to_spir(const struct clc_compile_args *args, |
| const struct clc_logger *logger, |
| struct clc_binary *out_spir) |
| { |
| return clc_c_to_spir(args, logger, out_spir) >= 0; |
| } |
| |
| void |
| clc_free_spir(struct clc_binary *spir) |
| { |
| clc_free_spir_binary(spir); |
| } |
| |
| bool |
| clc_compile_spir_to_spirv(const struct clc_binary *in_spir, |
| const struct clc_logger *logger, |
| struct clc_binary *out_spirv) |
| { |
| if (clc_spir_to_spirv(in_spir, logger, out_spirv) < 0) |
| return false; |
| |
| if (debug_get_option_debug_clc() & CLC_DEBUG_DUMP_SPIRV) |
| clc_dump_spirv(out_spirv, stdout); |
| |
| return true; |
| } |
| |
| void |
| clc_free_spirv(struct clc_binary *spirv) |
| { |
| clc_free_spirv_binary(spirv); |
| } |
| |
| bool |
| clc_compile_c_to_spirv(const struct clc_compile_args *args, |
| const struct clc_logger *logger, |
| struct clc_binary *out_spirv) |
| { |
| if (clc_c_to_spirv(args, logger, out_spirv) < 0) |
| return false; |
| |
| if (debug_get_option_debug_clc() & CLC_DEBUG_DUMP_SPIRV) |
| clc_dump_spirv(out_spirv, stdout); |
| |
| return true; |
| } |
| |
| bool |
| clc_link_spirv(const struct clc_linker_args *args, |
| const struct clc_logger *logger, |
| struct clc_binary *out_spirv) |
| { |
| if (clc_link_spirv_binaries(args, logger, out_spirv) < 0) |
| return false; |
| |
| if (debug_get_option_debug_clc() & CLC_DEBUG_DUMP_SPIRV) |
| clc_dump_spirv(out_spirv, stdout); |
| |
| return true; |
| } |
| |
| bool |
| clc_parse_spirv(const struct clc_binary *in_spirv, |
| const struct clc_logger *logger, |
| struct clc_parsed_spirv *out_data) |
| { |
| if (!clc_spirv_get_kernels_info(in_spirv, |
| &out_data->kernels, |
| &out_data->num_kernels, |
| &out_data->spec_constants, |
| &out_data->num_spec_constants, |
| logger)) |
| return false; |
| |
| if (debug_get_option_debug_clc() & CLC_DEBUG_VERBOSE) |
| clc_print_kernels_info(out_data); |
| |
| return true; |
| } |
| |
| void clc_free_parsed_spirv(struct clc_parsed_spirv *data) |
| { |
| clc_free_kernels_info(data->kernels, data->num_kernels); |
| } |
| |
| bool |
| clc_specialize_spirv(const struct clc_binary *in_spirv, |
| const struct clc_parsed_spirv *parsed_data, |
| const struct clc_spirv_specialization_consts *consts, |
| struct clc_binary *out_spirv) |
| { |
| if (!clc_spirv_specialize(in_spirv, parsed_data, consts, out_spirv)) |
| return false; |
| |
| if (debug_get_option_debug_clc() & CLC_DEBUG_DUMP_SPIRV) |
| clc_dump_spirv(out_spirv, stdout); |
| |
| return true; |
| } |