/**********************************************************
 * Copyright 2008-2009 VMware, Inc. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person
 * obtaining a copy of this software and associated documentation
 * files (the "Software"), to deal in the Software without
 * restriction, including without limitation the rights to use, copy,
 * modify, merge, publish, distribute, sublicense, and/or sell copies
 * of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be
 * included in all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 **********************************************************/
| 25 | |
| 26 | |
| 27 | #include "pipe/p_compiler.h" |
| 28 | #include "pipe/p_shader_tokens.h" |
| 29 | #include "pipe/p_defines.h" |
| 30 | #include "tgsi/tgsi_parse.h" |
| 31 | #include "tgsi/tgsi_dump.h" |
| 32 | #include "tgsi/tgsi_scan.h" |
Brian Paul | 58ea42b | 2011-11-03 17:40:56 -0600 | [diff] [blame] | 33 | #include "util/u_math.h" |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 34 | #include "util/u_memory.h" |
José Fonseca | cdb445f | 2010-01-03 00:47:30 +0000 | [diff] [blame] | 35 | #include "util/u_bitmask.h" |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 36 | |
José Fonseca | 178407f | 2009-11-24 14:37:45 +0000 | [diff] [blame] | 37 | #include "svgadump/svga_shader_dump.h" |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 38 | |
| 39 | #include "svga_context.h" |
Brian Paul | e054251 | 2015-08-13 11:00:58 -0700 | [diff] [blame] | 40 | #include "svga_shader.h" |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 41 | #include "svga_tgsi.h" |
| 42 | #include "svga_tgsi_emit.h" |
| 43 | #include "svga_debug.h" |
| 44 | |
| 45 | #include "svga_hw_reg.h" |
| 46 | #include "svga3d_shaderdefs.h" |
| 47 | |
| 48 | |
/**
 * Static "sinkhole" buffer.
 *
 * When the emitter's heap buffer cannot be grown, the emitter is pointed
 * at this array instead so that it always has valid storage to refer to.
 * Code that releases the emitter buffer compares against err_buf first,
 * because this storage must never be passed to FREE or REALLOC.
 */
static char err_buf[128];
| 52 | |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 53 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 54 | static boolean |
| 55 | svga_shader_expand(struct svga_shader_emitter *emit) |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 56 | { |
| 57 | char *new_buf; |
| 58 | unsigned newsize = emit->size * 2; |
| 59 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 60 | if (emit->buf != err_buf) |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 61 | new_buf = REALLOC(emit->buf, emit->size, newsize); |
| 62 | else |
| 63 | new_buf = NULL; |
| 64 | |
Edward O'Callaghan | 13eb5f5 | 2015-12-04 22:08:22 +1100 | [diff] [blame] | 65 | if (!new_buf) { |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 66 | emit->ptr = err_buf; |
| 67 | emit->buf = err_buf; |
| 68 | emit->size = sizeof(err_buf); |
| 69 | return FALSE; |
| 70 | } |
| 71 | |
| 72 | emit->size = newsize; |
| 73 | emit->ptr = new_buf + (emit->ptr - emit->buf); |
| 74 | emit->buf = new_buf; |
| 75 | return TRUE; |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 76 | } |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 77 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 78 | |
Ilia Mirkin | a2a1a58 | 2015-07-20 19:58:43 -0400 | [diff] [blame] | 79 | static inline boolean |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 80 | reserve(struct svga_shader_emitter *emit, unsigned nr_dwords) |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 81 | { |
| 82 | if (emit->ptr - emit->buf + nr_dwords * sizeof(unsigned) >= emit->size) { |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 83 | if (!svga_shader_expand(emit)) { |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 84 | return FALSE; |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 85 | } |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 86 | } |
| 87 | |
| 88 | return TRUE; |
| 89 | } |
| 90 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 91 | |
| 92 | boolean |
| 93 | svga_shader_emit_dword(struct svga_shader_emitter * emit, unsigned dword) |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 94 | { |
| 95 | if (!reserve(emit, 1)) |
| 96 | return FALSE; |
| 97 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 98 | *(unsigned *) emit->ptr = dword; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 99 | emit->ptr += sizeof dword; |
| 100 | return TRUE; |
| 101 | } |
| 102 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 103 | |
| 104 | boolean |
| 105 | svga_shader_emit_dwords(struct svga_shader_emitter * emit, |
| 106 | const unsigned *dwords, unsigned nr) |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 107 | { |
| 108 | if (!reserve(emit, nr)) |
| 109 | return FALSE; |
| 110 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 111 | memcpy(emit->ptr, dwords, nr * sizeof *dwords); |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 112 | emit->ptr += nr * sizeof *dwords; |
| 113 | return TRUE; |
| 114 | } |
| 115 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 116 | |
| 117 | boolean |
| 118 | svga_shader_emit_opcode(struct svga_shader_emitter * emit, unsigned opcode) |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 119 | { |
| 120 | SVGA3dShaderInstToken *here; |
| 121 | |
| 122 | if (!reserve(emit, 1)) |
| 123 | return FALSE; |
| 124 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 125 | here = (SVGA3dShaderInstToken *) emit->ptr; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 126 | here->value = opcode; |
| 127 | |
| 128 | if (emit->insn_offset) { |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 129 | SVGA3dShaderInstToken *prev = |
| 130 | (SVGA3dShaderInstToken *) (emit->buf + emit->insn_offset); |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 131 | prev->size = (here - prev) - 1; |
| 132 | } |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 133 | |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 134 | emit->insn_offset = emit->ptr - emit->buf; |
| 135 | emit->ptr += sizeof(unsigned); |
| 136 | return TRUE; |
| 137 | } |
| 138 | |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 139 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 140 | static boolean |
| 141 | svga_shader_emit_header(struct svga_shader_emitter *emit) |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 142 | { |
| 143 | SVGA3dShaderVersion header; |
| 144 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 145 | memset(&header, 0, sizeof header); |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 146 | |
| 147 | switch (emit->unit) { |
| 148 | case PIPE_SHADER_FRAGMENT: |
Brian Paul | 94b219b | 2011-10-11 09:30:09 -0600 | [diff] [blame] | 149 | header.value = SVGA3D_PS_30; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 150 | break; |
| 151 | case PIPE_SHADER_VERTEX: |
Brian Paul | 94b219b | 2011-10-11 09:30:09 -0600 | [diff] [blame] | 152 | header.value = SVGA3D_VS_30; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 153 | break; |
| 154 | } |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 155 | |
| 156 | return svga_shader_emit_dword(emit, header.value); |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 157 | } |
| 158 | |
| 159 | |
Brian Paul | 58ea42b | 2011-11-03 17:40:56 -0600 | [diff] [blame] | 160 | /** |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 161 | * Parse TGSI shader and translate to SVGA/DX9 serialized |
| 162 | * representation. |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 163 | * |
| 164 | * In this function SVGA shader is emitted to an in-memory buffer that |
| 165 | * can be dynamically grown. Once we've finished and know how large |
| 166 | * it is, it will be copied to a hardware buffer for upload. |
| 167 | */ |
Brian Paul | e054251 | 2015-08-13 11:00:58 -0700 | [diff] [blame] | 168 | struct svga_shader_variant * |
Brian Paul | 8d0d5dc | 2015-10-08 21:03:27 -0600 | [diff] [blame] | 169 | svga_tgsi_vgpu9_translate(struct svga_context *svga, |
| 170 | const struct svga_shader *shader, |
Brian Paul | e054251 | 2015-08-13 11:00:58 -0700 | [diff] [blame] | 171 | const struct svga_compile_key *key, unsigned unit) |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 172 | { |
Brian Paul | 2a30379 | 2014-01-18 03:45:41 -0800 | [diff] [blame] | 173 | struct svga_shader_variant *variant = NULL; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 174 | struct svga_shader_emitter emit; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 175 | |
Charmaine Lee | 2e1cfcc | 2016-08-19 08:49:17 -0600 | [diff] [blame] | 176 | SVGA_STATS_TIME_PUSH(svga_sws(svga), SVGA_STATS_TIME_TGSIVGPU9TRANSLATE); |
| 177 | |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 178 | memset(&emit, 0, sizeof(emit)); |
| 179 | |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 180 | emit.size = 1024; |
| 181 | emit.buf = MALLOC(emit.size); |
| 182 | if (emit.buf == NULL) { |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 183 | goto fail; |
| 184 | } |
| 185 | |
| 186 | emit.ptr = emit.buf; |
| 187 | emit.unit = unit; |
Brian Paul | ba49798 | 2013-06-28 08:09:48 -0600 | [diff] [blame] | 188 | emit.key = *key; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 189 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 190 | tgsi_scan_shader(shader->tokens, &emit.info); |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 191 | |
| 192 | emit.imm_start = emit.info.file_max[TGSI_FILE_CONSTANT] + 1; |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 193 | |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 194 | if (unit == PIPE_SHADER_FRAGMENT) |
Brian Paul | e054251 | 2015-08-13 11:00:58 -0700 | [diff] [blame] | 195 | emit.imm_start += key->num_unnormalized_coords; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 196 | |
| 197 | if (unit == PIPE_SHADER_VERTEX) { |
Brian Paul | e054251 | 2015-08-13 11:00:58 -0700 | [diff] [blame] | 198 | emit.imm_start += key->vs.need_prescale ? 2 : 0; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 199 | } |
| 200 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 201 | emit.nr_hw_float_const = |
| 202 | (emit.imm_start + emit.info.file_max[TGSI_FILE_IMMEDIATE] + 1); |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 203 | |
| 204 | emit.nr_hw_temp = emit.info.file_max[TGSI_FILE_TEMPORARY] + 1; |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 205 | |
Brian Paul | 9b3d87b | 2012-06-29 16:53:35 -0600 | [diff] [blame] | 206 | if (emit.nr_hw_temp >= SVGA3D_TEMPREG_MAX) { |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 207 | debug_printf("svga: too many temporary registers (%u)\n", |
| 208 | emit.nr_hw_temp); |
Brian Paul | f12f67c | 2011-11-17 16:36:26 -0700 | [diff] [blame] | 209 | goto fail; |
Brian Paul | 9b3d87b | 2012-06-29 16:53:35 -0600 | [diff] [blame] | 210 | } |
Brian Paul | f12f67c | 2011-11-17 16:36:26 -0700 | [diff] [blame] | 211 | |
Charmaine Lee | 57d9222 | 2017-08-01 18:02:57 -0700 | [diff] [blame] | 212 | if (emit.info.indirect_files & (1 << TGSI_FILE_TEMPORARY)) { |
| 213 | debug_printf( |
| 214 | "svga: indirect indexing of temporary registers is not supported.\n"); |
| 215 | goto fail; |
| 216 | } |
| 217 | |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 218 | emit.in_main_func = TRUE; |
| 219 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 220 | if (!svga_shader_emit_header(&emit)) { |
Brian Paul | 9b3d87b | 2012-06-29 16:53:35 -0600 | [diff] [blame] | 221 | debug_printf("svga: emit header failed\n"); |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 222 | goto fail; |
Brian Paul | 9b3d87b | 2012-06-29 16:53:35 -0600 | [diff] [blame] | 223 | } |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 224 | |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 225 | if (!svga_shader_emit_instructions(&emit, shader->tokens)) { |
Brian Paul | 9b3d87b | 2012-06-29 16:53:35 -0600 | [diff] [blame] | 226 | debug_printf("svga: emit instructions failed\n"); |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 227 | goto fail; |
Brian Paul | 9b3d87b | 2012-06-29 16:53:35 -0600 | [diff] [blame] | 228 | } |
| 229 | |
Brian Paul | f413f1a | 2015-10-08 21:06:18 -0600 | [diff] [blame] | 230 | variant = svga_new_shader_variant(svga); |
Edward O'Callaghan | 13eb5f5 | 2015-12-04 22:08:22 +1100 | [diff] [blame] | 231 | if (!variant) |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 232 | goto fail; |
| 233 | |
Brian Paul | 2a30379 | 2014-01-18 03:45:41 -0800 | [diff] [blame] | 234 | variant->shader = shader; |
| 235 | variant->tokens = (const unsigned *) emit.buf; |
| 236 | variant->nr_tokens = (emit.ptr - emit.buf) / sizeof(unsigned); |
| 237 | memcpy(&variant->key, key, sizeof(*key)); |
| 238 | variant->id = UTIL_BITMASK_INVALID_INDEX; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 239 | |
Brian Paul | e054251 | 2015-08-13 11:00:58 -0700 | [diff] [blame] | 240 | variant->pstipple_sampler_unit = emit.pstipple_sampler_unit; |
| 241 | |
Brian Paul | 1082735 | 2015-10-22 15:36:25 -0600 | [diff] [blame] | 242 | /* If there was exactly one write to a fragment shader output register |
| 243 | * and it came from a constant buffer, we know all fragments will have |
| 244 | * the same color (except for blending). |
| 245 | */ |
| 246 | variant->constant_color_output = |
| 247 | emit.constant_color_output && emit.num_output_writes == 1; |
| 248 | |
Brian Paul | e054251 | 2015-08-13 11:00:58 -0700 | [diff] [blame] | 249 | #if 0 |
| 250 | if (!svga_shader_verify(variant->tokens, variant->nr_tokens) || |
| 251 | SVGA_DEBUG & DEBUG_TGSI) { |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 252 | debug_printf("#####################################\n"); |
| 253 | debug_printf("Shader %u below\n", shader->id); |
| 254 | tgsi_dump(shader->tokens, 0); |
José Fonseca | 6dd9676 | 2009-11-27 13:59:37 +0000 | [diff] [blame] | 255 | if (SVGA_DEBUG & DEBUG_TGSI) { |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 256 | debug_printf("Shader %u compiled below\n", shader->id); |
Brian Paul | 2a30379 | 2014-01-18 03:45:41 -0800 | [diff] [blame] | 257 | svga_shader_dump(variant->tokens, variant->nr_tokens, FALSE); |
José Fonseca | 6dd9676 | 2009-11-27 13:59:37 +0000 | [diff] [blame] | 258 | } |
Brian Paul | 2e8c51c | 2013-06-19 10:39:43 -0600 | [diff] [blame] | 259 | debug_printf("#####################################\n"); |
José Fonseca | 6dd9676 | 2009-11-27 13:59:37 +0000 | [diff] [blame] | 260 | } |
Brian Paul | e054251 | 2015-08-13 11:00:58 -0700 | [diff] [blame] | 261 | #endif |
José Fonseca | 6dd9676 | 2009-11-27 13:59:37 +0000 | [diff] [blame] | 262 | |
Charmaine Lee | 2e1cfcc | 2016-08-19 08:49:17 -0600 | [diff] [blame] | 263 | goto done; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 264 | |
Charmaine Lee | 2e1cfcc | 2016-08-19 08:49:17 -0600 | [diff] [blame] | 265 | fail: |
Brian Paul | 2a30379 | 2014-01-18 03:45:41 -0800 | [diff] [blame] | 266 | FREE(variant); |
Brian Paul | 96e0894 | 2016-03-29 13:34:36 -0600 | [diff] [blame] | 267 | if (emit.buf != err_buf) |
| 268 | FREE(emit.buf); |
Charmaine Lee | 2e1cfcc | 2016-08-19 08:49:17 -0600 | [diff] [blame] | 269 | variant = NULL; |
| 270 | |
| 271 | done: |
| 272 | SVGA_STATS_TIME_POP(svga_sws(svga)); |
| 273 | return variant; |
Jakob Bornecrantz | 3192633 | 2009-11-16 19:56:18 +0100 | [diff] [blame] | 274 | } |