blob: 1e1fbb099c67e7ba69b5df2f6758f9c79ee50962 [file] [log] [blame]
/**********************************************************
* Copyright 2008-2009 VMware, Inc. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person
* obtaining a copy of this software and associated documentation
* files (the "Software"), to deal in the Software without
* restriction, including without limitation the rights to use, copy,
* modify, merge, publish, distribute, sublicense, and/or sell copies
* of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be
* included in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*
**********************************************************/
#include "util/u_inlines.h"
#include "util/u_memory.h"
#include "pipe/p_defines.h"
#include "svga_screen.h"
#include "svga_context.h"
#include "svga_state.h"
#include "svga_cmd.h"
#include "svga_tgsi.h"
#include "svga_debug.h"
#include "svga_resource_buffer.h"
#include "svga_hw_reg.h"
/*
* Don't try to send more than 4kb of successive constants.
*/
#define MAX_CONST_REG_COUNT 256 /**< number of float[4] constants */
/**
* Extra space for svga-specific VS/PS constants (such as texcoord
* scale factors, vertex transformation scale/translation).
*/
#define MAX_EXTRA_CONSTS 32
/** Guest-backed surface constant buffers must be this size */
#define GB_CONSTBUF_SIZE (SVGA3D_CONSTREG_MAX)
/**
* Convert from PIPE_SHADER_* to SVGA3D_SHADERTYPE_*
*/
static unsigned
svga_shader_type(unsigned shader)
{
switch (shader) {
case PIPE_SHADER_VERTEX:
return SVGA3D_SHADERTYPE_VS;
case PIPE_SHADER_FRAGMENT:
return SVGA3D_SHADERTYPE_PS;
default:
assert(!"Unexpected shader type");
return SVGA3D_SHADERTYPE_VS;
}
}
/**
* Emit any extra fragment shader constants into the buffer pointed
* to by 'dest'.
* In particular, these would be the scaling factors needed for handling
* unnormalized texture coordinates for texture rectangles.
* \return number of float[4] constants put into the dest buffer
*/
static unsigned
svga_get_extra_fs_constants(struct svga_context *svga, float *dest)
{
const struct svga_shader_variant *variant = svga->state.hw_draw.fs;
const struct svga_fs_compile_key *key = &variant->key.fkey;
unsigned count = 0;
/* SVGA_NEW_VS_VARIANT
*/
if (key->num_unnormalized_coords) {
unsigned i;
for (i = 0; i < key->num_textures; i++) {
if (key->tex[i].unnormalized) {
struct pipe_resource *tex = svga->curr.sampler_views[i]->texture;
/* debug/sanity check */
assert(key->tex[i].width_height_idx == count);
*dest++ = 1.0 / (float)tex->width0;
*dest++ = 1.0 / (float)tex->height0;
*dest++ = 1.0;
*dest++ = 1.0;
count++;
}
}
}
assert(count <= MAX_EXTRA_CONSTS);
return count;
}
/**
* Emit any extra vertex shader constants into the buffer pointed
* to by 'dest'.
* In particular, these would be the scale and bias factors computed
* from the framebuffer size which are used to copy with differences in
* GL vs D3D coordinate spaces. See svga_tgsi_insn.c for more info.
* \return number of float[4] constants put into the dest buffer
*/
static unsigned
svga_get_extra_vs_constants(struct svga_context *svga, float *dest)
{
const struct svga_shader_variant *variant = svga->state.hw_draw.vs;
const struct svga_vs_compile_key *key = &variant->key.vkey;
unsigned count = 0;
/* SVGA_NEW_VS_VARIANT
*/
if (key->need_prescale) {
memcpy(dest, svga->state.hw_clear.prescale.scale, 4 * sizeof(float));
dest += 4;
memcpy(dest, svga->state.hw_clear.prescale.translate, 4 * sizeof(float));
dest += 4;
count = 2;
}
assert(count <= MAX_EXTRA_CONSTS);
return count;
}
/**
* Check and emit one shader constant register.
* \param shader PIPE_SHADER_FRAGMENT or PIPE_SHADER_VERTEX
* \param i which float[4] constant to change
* \param value the new float[4] value
*/
static enum pipe_error
emit_const(struct svga_context *svga, unsigned shader, unsigned i,
const float *value)
{
enum pipe_error ret = PIPE_OK;
assert(shader < PIPE_SHADER_TYPES);
assert(i < SVGA3D_CONSTREG_MAX);
if (memcmp(svga->state.hw_draw.cb[shader][i], value,
4 * sizeof(float)) != 0) {
if (SVGA_DEBUG & DEBUG_CONSTS)
debug_printf("%s %s %u: %f %f %f %f\n",
__FUNCTION__,
shader == PIPE_SHADER_VERTEX ? "VERT" : "FRAG",
i,
value[0],
value[1],
value[2],
value[3]);
ret = SVGA3D_SetShaderConst( svga->swc,
i,
svga_shader_type(shader),
SVGA3D_CONST_TYPE_FLOAT,
value );
if (ret != PIPE_OK)
return ret;
memcpy(svga->state.hw_draw.cb[shader][i], value, 4 * sizeof(float));
}
return ret;
}
/*
* Check and emit a range of shader constant registers, trying to coalesce
* successive shader constant updates in a single command in order to save
* space on the command buffer. This is a HWv8 feature.
*/
static enum pipe_error
emit_const_range(struct svga_context *svga,
unsigned shader,
unsigned offset,
unsigned count,
const float (*values)[4])
{
unsigned i, j;
enum pipe_error ret;
#ifdef DEBUG
if (offset + count > SVGA3D_CONSTREG_MAX) {
debug_printf("svga: too many constants (offset %u + count %u = %u (max = %u))\n",
offset, count, offset + count, SVGA3D_CONSTREG_MAX);
}
#endif
if (offset > SVGA3D_CONSTREG_MAX) {
/* This isn't OK, but if we propagate an error all the way up we'll
* just get into more trouble.
* XXX note that offset is always zero at this time so this is moot.
*/
return PIPE_OK;
}
if (offset + count > SVGA3D_CONSTREG_MAX) {
/* Just drop the extra constants for now.
* Ideally we should not have allowed the app to create a shader
* that exceeds our constant buffer size but there's no way to
* express that in gallium at this time.
*/
count = SVGA3D_CONSTREG_MAX - offset;
}
i = 0;
while (i < count) {
if (memcmp(svga->state.hw_draw.cb[shader][offset + i],
values[i],
4 * sizeof(float)) != 0) {
/* Found one dirty constant
*/
if (SVGA_DEBUG & DEBUG_CONSTS)
debug_printf("%s %s %d: %f %f %f %f\n",
__FUNCTION__,
shader == PIPE_SHADER_VERTEX ? "VERT" : "FRAG",
offset + i,
values[i][0],
values[i][1],
values[i][2],
values[i][3]);
/* Look for more consecutive dirty constants.
*/
j = i + 1;
while (j < count &&
j < i + MAX_CONST_REG_COUNT &&
memcmp(svga->state.hw_draw.cb[shader][offset + j],
values[j],
4 * sizeof(float)) != 0) {
if (SVGA_DEBUG & DEBUG_CONSTS)
debug_printf("%s %s %d: %f %f %f %f\n",
__FUNCTION__,
shader == PIPE_SHADER_VERTEX ? "VERT" : "FRAG",
offset + j,
values[j][0],
values[j][1],
values[j][2],
values[j][3]);
++j;
}
assert(j >= i + 1);
/* Send them all together.
*/
if (svga_have_gb_objects(svga)) {
ret = SVGA3D_SetGBShaderConstsInline(svga->swc,
offset + i, /* start */
j - i, /* count */
svga_shader_type(shader),
SVGA3D_CONST_TYPE_FLOAT,
values + i);
}
else {
ret = SVGA3D_SetShaderConsts(svga->swc,
offset + i, j - i,
svga_shader_type(shader),
SVGA3D_CONST_TYPE_FLOAT,
values + i);
}
if (ret != PIPE_OK) {
return ret;
}
/*
* Local copy of the hardware state.
*/
memcpy(svga->state.hw_draw.cb[shader][offset + i],
values[i],
(j - i) * 4 * sizeof(float));
i = j + 1;
} else {
++i;
}
}
return PIPE_OK;
}
/**
* Emit all the constants in a constant buffer for a shader stage.
*/
static enum pipe_error
emit_consts(struct svga_context *svga, unsigned shader)
{
struct svga_screen *ss = svga_screen(svga->pipe.screen);
struct pipe_transfer *transfer = NULL;
unsigned count;
const float (*data)[4] = NULL;
unsigned i;
enum pipe_error ret = PIPE_OK;
const unsigned offset = 0;
assert(shader < PIPE_SHADER_TYPES);
if (svga->curr.cbufs[shader].buffer == NULL)
goto done;
data = (const float (*)[4])pipe_buffer_map(&svga->pipe,
svga->curr.cbufs[shader].buffer,
PIPE_TRANSFER_READ,
&transfer);
if (data == NULL) {
ret = PIPE_ERROR_OUT_OF_MEMORY;
goto done;
}
/* sanity check */
assert(svga->curr.cbufs[shader].buffer->width0 >=
svga->curr.cbufs[shader].buffer_size);
/* Use/apply the constant buffer size and offsets here */
count = svga->curr.cbufs[shader].buffer_size / (4 * sizeof(float));
data += svga->curr.cbufs[shader].buffer_offset / (4 * sizeof(float));
if (ss->hw_version >= SVGA3D_HWVERSION_WS8_B1) {
ret = emit_const_range( svga, shader, offset, count, data );
if (ret != PIPE_OK) {
goto done;
}
} else {
for (i = 0; i < count; i++) {
ret = emit_const( svga, shader, offset + i, data[i] );
if (ret != PIPE_OK) {
goto done;
}
}
}
done:
if (data)
pipe_buffer_unmap(&svga->pipe, transfer);
return ret;
}
static enum pipe_error
emit_fs_consts(struct svga_context *svga, unsigned dirty)
{
struct svga_screen *ss = svga_screen(svga->pipe.screen);
const struct svga_shader_variant *variant = svga->state.hw_draw.fs;
enum pipe_error ret = PIPE_OK;
/* SVGA_NEW_FS_VARIANT
*/
if (variant == NULL)
return PIPE_OK;
/* SVGA_NEW_FS_CONST_BUFFER
*/
ret = emit_consts( svga, PIPE_SHADER_FRAGMENT );
if (ret != PIPE_OK)
return ret;
/* emit extra shader constants */
{
unsigned offset = variant->shader->info.file_max[TGSI_FILE_CONSTANT] + 1;
float extras[MAX_EXTRA_CONSTS][4];
unsigned count, i;
count = svga_get_extra_fs_constants(svga, (float *) extras);
if (ss->hw_version >= SVGA3D_HWVERSION_WS8_B1) {
ret = emit_const_range(svga, PIPE_SHADER_FRAGMENT, offset, count,
(const float (*) [4])extras);
} else {
for (i = 0; i < count; i++) {
ret = emit_const(svga, PIPE_SHADER_FRAGMENT, offset + i, extras[i]);
if (ret != PIPE_OK)
return ret;
}
}
}
return ret;
}
struct svga_tracked_state svga_hw_fs_constants =
{
"hw fs params",
(SVGA_NEW_FS_CONST_BUFFER |
SVGA_NEW_FS_VARIANT |
SVGA_NEW_TEXTURE_BINDING),
emit_fs_consts
};
static enum pipe_error
emit_vs_consts(struct svga_context *svga, unsigned dirty)
{
struct svga_screen *ss = svga_screen(svga->pipe.screen);
const struct svga_shader_variant *variant = svga->state.hw_draw.vs;
enum pipe_error ret = PIPE_OK;
/* SVGA_NEW_VS_VARIANT
*/
if (variant == NULL)
return PIPE_OK;
/* SVGA_NEW_VS_CONST_BUFFER
*/
ret = emit_consts( svga, PIPE_SHADER_VERTEX );
if (ret != PIPE_OK)
return ret;
/* emit extra shader constants */
{
unsigned offset = variant->shader->info.file_max[TGSI_FILE_CONSTANT] + 1;
float extras[MAX_EXTRA_CONSTS][4];
unsigned count, i;
count = svga_get_extra_vs_constants(svga, (float *) extras);
assert(count <= Elements(extras));
if (ss->hw_version >= SVGA3D_HWVERSION_WS8_B1) {
ret = emit_const_range(svga, PIPE_SHADER_VERTEX, offset, count,
(const float (*) [4]) extras);
} else {
for (i = 0; i < count; i++) {
ret = emit_const(svga, PIPE_SHADER_VERTEX, offset + i, extras[i]);
if (ret != PIPE_OK)
return ret;
}
}
}
return ret;
}
struct svga_tracked_state svga_hw_vs_constants =
{
"hw vs params",
(SVGA_NEW_PRESCALE |
SVGA_NEW_VS_CONST_BUFFER |
SVGA_NEW_VS_VARIANT),
emit_vs_consts
};