/**********************************************************
* Copyright 2008-2009 VMware, Inc. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person
* obtaining a copy of this software and associated documentation
* files (the "Software"), to deal in the Software without
* restriction, including without limitation the rights to use, copy,
* modify, merge, publish, distribute, sublicense, and/or sell copies
* of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be
* included in all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*
**********************************************************/
#include "draw/draw_context.h"
#include "draw/draw_vbuf.h"
#include "util/u_bitmask.h"
#include "util/u_inlines.h"
#include "pipe/p_state.h"
#include "svga_cmd.h"
#include "svga_context.h"
#include "svga_shader.h"
#include "svga_swtnl.h"
#include "svga_state.h"
#include "svga_tgsi.h"
#include "svga_swtnl_private.h"
/*
 * Per-primitive sub-pixel offsets that set_draw_viewport() adds to the
 * viewport X/Y translation when svga_have_vgpu10() is false.
 *
 * Each replacement list is parenthesized so the negative literal stays a
 * single operand wherever the macro is expanded.
 */
#define SVGA_POINT_ADJ_X (-0.375f)
#define SVGA_POINT_ADJ_Y (-0.5f)
#define SVGA_LINE_ADJ_X (-0.5f)
#define SVGA_LINE_ADJ_Y (-0.5f)
#define SVGA_TRIANGLE_ADJ_X (-0.375f)
#define SVGA_TRIANGLE_ADJ_Y (-0.5f)
/**
 * Hand the current viewport to the draw module after shifting its X/Y
 * translation by an offset that depends on the reduced primitive type.
 *
 * With VGPU10 only triangles are shifted (by 0.25 in Y).  Otherwise the
 * SVGA_*_ADJ_* constants are used for points, lines and triangles; any
 * other primitive type leaves the viewport untouched.
 *
 * \param svga  context whose curr.viewport, curr.reduced_prim and
 *              curr.rast are read
 */
static void
set_draw_viewport(struct svga_context *svga)
{
   struct pipe_viewport_state vp = svga->curr.viewport;
   float dx = 0.0f;
   float dy = 0.0f;

   if (svga_have_vgpu10(svga)) {
      if (svga->curr.reduced_prim == PIPE_PRIM_TRIANGLES) {
         dy = 0.25f;
      }
   }
   else if (svga->curr.reduced_prim == PIPE_PRIM_POINTS) {
      dx = SVGA_POINT_ADJ_X;
      dy = SVGA_POINT_ADJ_Y;
   }
   else if (svga->curr.reduced_prim == PIPE_PRIM_LINES) {
      /* XXX: Wide lines end up being drawn as triangles, so they get a
       * slightly different offset.  Not every case where that happens
       * is detected here.
       */
      if (svga->curr.rast->need_pipeline & SVGA_PIPELINE_FLAG_LINES) {
         dx = SVGA_LINE_ADJ_X + 0.175f;
         dy = SVGA_LINE_ADJ_Y - 0.175f;
      }
      else {
         dx = SVGA_LINE_ADJ_X;
         dy = SVGA_LINE_ADJ_Y;
      }
   }
   else if (svga->curr.reduced_prim == PIPE_PRIM_TRIANGLES) {
      dx += SVGA_TRIANGLE_ADJ_X;
      dy += SVGA_TRIANGLE_ADJ_Y;
   }
   /* else: no adjustment for other primitive types */

   vp.translate[0] += dx;
   vp.translate[1] += dy;

   draw_set_viewport_states(svga->swtnl.draw, 0, 1, &vp);
}
/**
 * Forward the pieces of context state flagged in \p dirty to the draw
 * module.  The draw module is flushed first, then each state group is
 * pushed only if its SVGA_NEW_* bit is set.
 *
 * \param svga   context holding the current state and the draw context
 * \param dirty  bitmask of SVGA_NEW_* flags
 * \return always PIPE_OK
 */
static enum pipe_error
update_swtnl_draw(struct svga_context *svga, unsigned dirty)
{
   struct draw_context *draw = svga->swtnl.draw;

   SVGA_STATS_TIME_PUSH(svga_sws(svga), SVGA_STATS_TIME_SWTNLUPDATEDRAW);

   draw_flush(draw);

   if (dirty & SVGA_NEW_VS) {
      draw_bind_vertex_shader(draw, svga->curr.vs->draw_shader);
   }

   if (dirty & SVGA_NEW_FS) {
      draw_bind_fragment_shader(draw, svga->curr.fs->draw_shader);
   }

   if (dirty & SVGA_NEW_VBUFFER) {
      draw_set_vertex_buffers(draw, 0,
                              svga->curr.num_vertex_buffers,
                              svga->curr.vb);
   }

   if (dirty & SVGA_NEW_VELEMENT) {
      draw_set_vertex_elements(draw,
                               svga->curr.velems->count,
                               svga->curr.velems->velem);
   }

   if (dirty & SVGA_NEW_CLIP) {
      draw_set_clip_state(draw, &svga->curr.clip);
   }

   /* The viewport offset depends on the primitive type and rasterizer
    * state as well as on the viewport itself.
    */
   if (dirty & (SVGA_NEW_RAST |
                SVGA_NEW_REDUCED_PRIMITIVE |
                SVGA_NEW_VIEWPORT)) {
      set_draw_viewport(svga);
   }

   if (dirty & SVGA_NEW_RAST) {
      draw_set_rasterizer_state(draw,
                                &svga->curr.rast->templ,
                                (void *) svga->curr.rast);
   }

   /* Report the depth/stencil buffer format to the draw module, or
    * PIPE_FORMAT_NONE when no depth/stencil buffer is bound.
    */
   if (dirty & SVGA_NEW_FRAME_BUFFER) {
      if (svga->curr.framebuffer.zsbuf) {
         draw_set_zs_format(draw, svga->curr.framebuffer.zsbuf->format);
      }
      else {
         draw_set_zs_format(draw, PIPE_FORMAT_NONE);
      }
   }

   SVGA_STATS_TIME_POP(svga_sws(svga));
   return PIPE_OK;
}
struct svga_tracked_state svga_update_swtnl_draw =
{
"update draw module state",
(SVGA_NEW_VS |
SVGA_NEW_VBUFFER |
SVGA_NEW_VELEMENT |
SVGA_NEW_CLIP |
SVGA_NEW_VIEWPORT |
SVGA_NEW_RAST |
SVGA_NEW_FRAME_BUFFER |
SVGA_NEW_REDUCED_PRIMITIVE),
update_swtnl_draw
};
/**
 * Map a float vertex declaration type (FLOAT1..FLOAT4) to the surface
 * format with the same number of 32-bit float components.
 *
 * Any other declaration type trips an assertion and falls back to
 * SVGA3D_R32G32B32A32_FLOAT.
 */
static SVGA3dSurfaceFormat
translate_vertex_format(SVGA3dDeclType format)
{
   SVGA3dSurfaceFormat surface_format;

   switch (format) {
   case SVGA3D_DECLTYPE_FLOAT1:
      surface_format = SVGA3D_R32_FLOAT;
      break;
   case SVGA3D_DECLTYPE_FLOAT2:
      surface_format = SVGA3D_R32G32_FLOAT;
      break;
   case SVGA3D_DECLTYPE_FLOAT3:
      surface_format = SVGA3D_R32G32B32_FLOAT;
      break;
   case SVGA3D_DECLTYPE_FLOAT4:
      surface_format = SVGA3D_R32G32B32A32_FLOAT;
      break;
   default:
      assert(!"Unexpected format in translate_vertex_format()");
      surface_format = SVGA3D_R32G32B32A32_FLOAT;
      break;
   }

   return surface_format;
}
static SVGA3dElementLayoutId
svga_vdecl_to_input_element(struct svga_context *svga,
const SVGA3dVertexDecl *vdecl, unsigned num_decls)
{
SVGA3dElementLayoutId id;
SVGA3dInputElementDesc elements[PIPE_MAX_ATTRIBS];
enum pipe_error ret;
unsigned i;
assert(num_decls <= PIPE_MAX_ATTRIBS);
assert(svga_have_vgpu10(svga));
for (i = 0; i < num_decls; i++) {
elements[i].inputSlot = 0; /* vertex buffer index */
elements[i].alignedByteOffset = vdecl[i].array.offset;
elements[i].format = translate_vertex_format(vdecl[i].identity.type);
elements[i].inputSlotClass = SVGA3D_INPUT_PER_VERTEX_DATA;
elements[i].instanceDataStepRate = 0;
elements[i].inputRegister = i;
}
id = util_bitmask_add(svga->input_element_object_id_bm);
ret = SVGA3D_vgpu10_DefineElementLayout(svga->swc, num_decls, id, elements);
if (ret != PIPE_OK) {
svga_context_flush(svga, NULL);
ret = SVGA3D_vgpu10_DefineElementLayout(svga->swc, num_decls,
id, elements);
assert(ret == PIPE_OK);
}
return id;
}
/**
 * Rebuild the vertex layout used by the software-TNL vbuf backend.
 *
 * Fills the backend's vertex_info and a local vertex declaration array
 * with the position attribute followed by one entry per fragment shader
 * input (COLOR, GENERIC and FOG are emitted; POSITION is skipped).  The
 * result is compared with the declarations cached in the backend:
 *
 *  - VGPU10: if nothing changed and a layout id already exists, nothing
 *    more is done.  Otherwise any existing element layout is destroyed,
 *    a new one is defined and bound as the input layout.
 *  - Otherwise: nothing more is done if nothing changed.
 *
 * When the function does not exit early, the new declarations are
 * copied into the backend and svga->swtnl.new_vdecl is set.
 *
 * \param svga  the context; svga->curr.fs is dereferenced unconditionally
 * \return always PIPE_OK
 */
enum pipe_error
svga_swtnl_update_vdecl(struct svga_context *svga)
{
struct svga_vbuf_render *svga_render = svga_vbuf_render(svga->swtnl.backend);
struct draw_context *draw = svga->swtnl.draw;
struct vertex_info *vinfo = &svga_render->vertex_info;
SVGA3dVertexDecl vdecl[PIPE_MAX_ATTRIBS];
struct svga_fragment_shader *fs = svga->curr.fs;
int offset = 0;
int nr_decls = 0;
int src;
unsigned i;
int any_change;
SVGA_STATS_TIME_PUSH(svga_sws(svga), SVGA_STATS_TIME_SWTNLUPDATEVDECL);
/* Start from all-zero structures; vdecl is later compared as a whole
 * array with memcmp(), so unused entries must be zeroed too.
 */
memset(vinfo, 0, sizeof(*vinfo));
memset(vdecl, 0, sizeof(vdecl));
draw_prepare_shader_outputs(draw);
/* always add position */
src = draw_find_shader_output(draw, TGSI_SEMANTIC_POSITION, 0);
draw_emit_vertex_attr(vinfo, EMIT_4F, src);
vinfo->attrib[0].emit = EMIT_4F;
vdecl[0].array.offset = offset;
vdecl[0].identity.method = SVGA3D_DECLMETHOD_DEFAULT;
vdecl[0].identity.type = SVGA3D_DECLTYPE_FLOAT4;
vdecl[0].identity.usage = SVGA3D_DECLUSAGE_POSITIONT;
vdecl[0].identity.usageIndex = 0;
offset += 16;
nr_decls++;
/* Add one declaration per fragment shader input.  offset advances by
 * the byte size of each emitted attribute (16 for 4 floats, 4 for 1).
 *
 * NOTE(review): nr_decls is not bounds-checked against PIPE_MAX_ATTRIBS
 * in this loop; presumably the shader input count guarantees it fits --
 * confirm.
 */
for (i = 0; i < fs->base.info.num_inputs; i++) {
const enum tgsi_semantic sem_name = fs->base.info.input_semantic_name[i];
const unsigned sem_index = fs->base.info.input_semantic_index[i];
src = draw_find_shader_output(draw, sem_name, sem_index);
/* Filled in before the switch; the entry is only kept (nr_decls
 * incremented) by the cases that emit an attribute.
 */
vdecl[nr_decls].array.offset = offset;
vdecl[nr_decls].identity.usageIndex = sem_index;
switch (sem_name) {
case TGSI_SEMANTIC_COLOR:
draw_emit_vertex_attr(vinfo, EMIT_4F, src);
vdecl[nr_decls].identity.usage = SVGA3D_DECLUSAGE_COLOR;
vdecl[nr_decls].identity.type = SVGA3D_DECLTYPE_FLOAT4;
offset += 16;
nr_decls++;
break;
case TGSI_SEMANTIC_GENERIC:
draw_emit_vertex_attr(vinfo, EMIT_4F, src);
vdecl[nr_decls].identity.usage = SVGA3D_DECLUSAGE_TEXCOORD;
vdecl[nr_decls].identity.type = SVGA3D_DECLTYPE_FLOAT4;
/* Generic inputs use the fragment shader's remapped index. */
vdecl[nr_decls].identity.usageIndex =
svga_remap_generic_index(fs->generic_remap_table, sem_index);
offset += 16;
nr_decls++;
break;
case TGSI_SEMANTIC_FOG:
draw_emit_vertex_attr(vinfo, EMIT_1F, src);
vdecl[nr_decls].identity.usage = SVGA3D_DECLUSAGE_TEXCOORD;
vdecl[nr_decls].identity.type = SVGA3D_DECLTYPE_FLOAT1;
assert(vdecl[nr_decls].identity.usageIndex == 0);
offset += 4;
nr_decls++;
break;
case TGSI_SEMANTIC_POSITION:
/* generated internally, not a vertex shader output */
break;
default:
assert(0);
}
}
draw_compute_vertex_size(vinfo);
svga_render->vdecl_count = nr_decls;
/* All attributes share one stride: the summed size of the emitted
 * attributes.
 */
for (i = 0; i < svga_render->vdecl_count; i++) {
vdecl[i].array.stride = offset;
}
/* Non-zero if the new declarations differ from the cached ones. */
any_change = memcmp(svga_render->vdecl, vdecl, sizeof(vdecl));
if (svga_have_vgpu10(svga)) {
enum pipe_error ret;
/* Nothing to do if the layout is unchanged and already defined. */
if (!any_change && svga_render->layout_id != SVGA3D_INVALID_ID) {
goto done;
}
if (svga_render->layout_id != SVGA3D_INVALID_ID) {
/* destroy old */
ret = SVGA3D_vgpu10_DestroyElementLayout(svga->swc,
svga_render->layout_id);
if (ret != PIPE_OK) {
/* Flush the context and retry the command once. */
svga_context_flush(svga, NULL);
ret = SVGA3D_vgpu10_DestroyElementLayout(svga->swc,
svga_render->layout_id);
assert(ret == PIPE_OK);
}
/**
* reset current layout id state after the element layout is
* destroyed, so that if a new layout has the same layout id, we
* will know to re-issue the SetInputLayout command.
*/
if (svga->state.hw_draw.layout_id == svga_render->layout_id)
svga->state.hw_draw.layout_id = SVGA3D_INVALID_ID;
/* Release the destroyed layout's id back to the id bitmask. */
util_bitmask_clear(svga->input_element_object_id_bm,
svga_render->layout_id);
}
/* Define the new element layout and remember its id. */
svga_render->layout_id =
svga_vdecl_to_input_element(svga, vdecl, nr_decls);
/* bind new */
if (svga->state.hw_draw.layout_id != svga_render->layout_id) {
ret = SVGA3D_vgpu10_SetInputLayout(svga->swc, svga_render->layout_id);
if (ret != PIPE_OK) {
/* Flush the context and retry the command once. */
svga_context_flush(svga, NULL);
ret = SVGA3D_vgpu10_SetInputLayout(svga->swc,
svga_render->layout_id);
assert(ret == PIPE_OK);
}
svga->state.hw_draw.layout_id = svga_render->layout_id;
}
}
else {
if (!any_change)
goto done;
}
/* Cache the new declarations and flag that they changed. */
memcpy(svga_render->vdecl, vdecl, sizeof(vdecl));
svga->swtnl.new_vdecl = TRUE;
done:
SVGA_STATS_TIME_POP(svga_sws(svga));
return PIPE_OK;
}
static enum pipe_error
update_swtnl_vdecl(struct svga_context *svga, unsigned dirty)
{
return svga_swtnl_update_vdecl(svga);
}
/**
 * Tracked-state entry for update_swtnl_vdecl(): a label, the SVGA_NEW_*
 * bits this entry is associated with (vertex and fragment shader
 * changes), and the update callback.
 */
struct svga_tracked_state svga_update_swtnl_vdecl =
{
   "update draw module vdecl",
   (SVGA_NEW_VS | SVGA_NEW_FS),
   update_swtnl_vdecl
};