1 /*
2  * Copyright (C) 2018-2019 Alyssa Rosenzweig <alyssa@rosenzweig.io>
3  * Copyright (C) 2019-2020 Collabora, Ltd.
4  *
5  * Permission is hereby granted, free of charge, to any person obtaining a
6  * copy of this software and associated documentation files (the "Software"),
7  * to deal in the Software without restriction, including without limitation
8  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9  * and/or sell copies of the Software, and to permit persons to whom the
10  * Software is furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice (including the next
13  * paragraph) shall be included in all copies or substantial portions of the
14  * Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  */
24 
25 #ifndef __MIDGARD_H_
26 #define __MIDGARD_H_
27 
28 #include "compiler/nir/nir.h"
29 #include "util/u_dynarray.h"
30 #include "panfrost/util/pan_ir.h"
31 
32 panfrost_program *
33 midgard_compile_shader_nir(void *mem_ctx, nir_shader *nir,
34                            const struct panfrost_compile_inputs *inputs);
35 
36 /* NIR options are shared between the standalone compiler and the online
37  * compiler. Defining it here is the simplest, though maybe not the Right
38  * solution. */
39 
40 static const nir_shader_compiler_options midgard_nir_options = {
41         .lower_ffma16 = true,
42         .lower_ffma32 = true,
43         .lower_ffma64 = true,
44         .lower_scmp = true,
45         .lower_flrp16 = true,
46         .lower_flrp32 = true,
47         .lower_flrp64 = true,
48         .lower_ffract = true,
49         .lower_fmod = true,
50         .lower_fdiv = true,
51         .lower_isign = true,
52         .lower_fpow = true,
53         .lower_find_lsb = true,
54         .lower_fdph = true,
55 
56         .lower_wpos_pntc = true,
57 
58         /* TODO: We have native ops to help here, which we'll want to look into
59          * eventually */
60         .lower_fsign = true,
61 
62         .lower_extract_byte = true,
63         .lower_extract_word = true,
64         .lower_rotate = true,
65 
66         .lower_pack_half_2x16 = true,
67         .lower_pack_unorm_2x16 = true,
68         .lower_pack_snorm_2x16 = true,
69         .lower_pack_unorm_4x8 = true,
70         .lower_pack_snorm_4x8 = true,
71         .lower_unpack_half_2x16 = true,
72         .lower_unpack_unorm_2x16 = true,
73         .lower_unpack_snorm_2x16 = true,
74         .lower_unpack_unorm_4x8 = true,
75         .lower_unpack_snorm_4x8 = true,
76         .lower_pack_split = true,
77 
78         .lower_doubles_options = nir_lower_dmod,
79 
80         .lower_bitfield_extract_to_shifts = true,
81         .vectorize_io = true,
82         .use_interpolated_input_intrinsics = true
83 };
84 
85 #endif
86