blob: 9d2b1a8f67c3208455ef426c49486bfc579cd16f [file] [log] [blame]
/*
* Copyright 2011 Joakim Sindholt <opensource@zhasha.com>
* Copyright 2013 Christoph Bumiller
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* on the rights to use, copy, modify, merge, publish, distribute, sub
* license, and/or sell copies of the Software, and to permit persons to whom
* the Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice (including the next
* paragraph) shall be included in all copies or substantial portions of the
* Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
* THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
* DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
* OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
* USE OR OTHER DEALINGS IN THE SOFTWARE. */
#include "device9.h"
#include "basetexture9.h"
#include "buffer9.h"
#include "indexbuffer9.h"
#include "surface9.h"
#include "vertexbuffer9.h"
#include "vertexdeclaration9.h"
#include "vertexshader9.h"
#include "pixelshader9.h"
#include "nine_pipe.h"
#include "nine_ff.h"
#include "nine_limits.h"
#include "pipe/p_context.h"
#include "pipe/p_state.h"
#include "cso_cache/cso_context.h"
#include "util/u_upload_mgr.h"
#include "util/u_math.h"
#include "util/u_box.h"
#include "util/u_simple_shaders.h"
#define DBG_CHANNEL DBG_DEVICE
/* Check if some states need to be set dirty */
static inline DWORD
check_multisample(struct NineDevice9 *device)
{
DWORD *rs = device->context.rs;
DWORD new_value = (rs[D3DRS_ZENABLE] || rs[D3DRS_STENCILENABLE]) &&
device->context.rt[0]->desc.MultiSampleType >= 1 &&
rs[D3DRS_MULTISAMPLEANTIALIAS];
if (rs[NINED3DRS_MULTISAMPLE] != new_value) {
rs[NINED3DRS_MULTISAMPLE] = new_value;
return NINE_STATE_RASTERIZER;
}
return 0;
}
/* State preparation only */
static inline void
prepare_blend(struct NineDevice9 *device)
{
nine_convert_blend_state(&device->context.pipe_data.blend, device->context.rs);
device->context.commit |= NINE_STATE_COMMIT_BLEND;
}
static inline void
prepare_dsa(struct NineDevice9 *device)
{
nine_convert_dsa_state(&device->context.pipe_data.dsa, device->context.rs);
device->context.commit |= NINE_STATE_COMMIT_DSA;
}
static inline void
prepare_rasterizer(struct NineDevice9 *device)
{
nine_convert_rasterizer_state(device, &device->context.pipe_data.rast, device->context.rs);
device->context.commit |= NINE_STATE_COMMIT_RASTERIZER;
}
static void
prepare_vs_constants_userbuf_swvp(struct NineDevice9 *device)
{
struct nine_context *context = &device->context;
if (context->changed.vs_const_f || context->changed.group & NINE_STATE_SWVP) {
struct pipe_constant_buffer cb;
cb.buffer_offset = 0;
cb.buffer_size = 4096 * sizeof(float[4]);
cb.user_buffer = context->vs_const_f_swvp;
if (context->vs->lconstf.ranges) {
const struct nine_lconstf *lconstf = &(context->vs->lconstf);
const struct nine_range *r = lconstf->ranges;
unsigned n = 0;
float *dst = context->vs_lconstf_temp;
float *src = (float *)cb.user_buffer;
memcpy(dst, src, cb.buffer_size);
while (r) {
unsigned p = r->bgn;
unsigned c = r->end - r->bgn;
memcpy(&dst[p * 4], &lconstf->data[n * 4], c * 4 * sizeof(float));
n += c;
r = r->next;
}
cb.user_buffer = dst;
}
/* Do not erase the buffer field.
* It is either NULL (user_cbufs), or a resource.
* u_upload_data will do the proper refcount */
context->pipe_data.cb0_swvp.buffer_offset = cb.buffer_offset;
context->pipe_data.cb0_swvp.buffer_size = cb.buffer_size;
context->pipe_data.cb0_swvp.user_buffer = cb.user_buffer;
cb.user_buffer = (char *)cb.user_buffer + 4096 * sizeof(float[4]);
context->pipe_data.cb1_swvp.buffer_offset = cb.buffer_offset;
context->pipe_data.cb1_swvp.buffer_size = cb.buffer_size;
context->pipe_data.cb1_swvp.user_buffer = cb.user_buffer;
context->changed.vs_const_f = 0;
}
if (context->changed.vs_const_i || context->changed.group & NINE_STATE_SWVP) {
struct pipe_constant_buffer cb;
cb.buffer_offset = 0;
cb.buffer_size = 2048 * sizeof(float[4]);
cb.user_buffer = context->vs_const_i;
context->pipe_data.cb2_swvp.buffer_offset = cb.buffer_offset;
context->pipe_data.cb2_swvp.buffer_size = cb.buffer_size;
context->pipe_data.cb2_swvp.user_buffer = cb.user_buffer;
context->changed.vs_const_i = 0;
}
if (context->changed.vs_const_b || context->changed.group & NINE_STATE_SWVP) {
struct pipe_constant_buffer cb;
cb.buffer_offset = 0;
cb.buffer_size = 512 * sizeof(float[4]);
cb.user_buffer = context->vs_const_b;
context->pipe_data.cb3_swvp.buffer_offset = cb.buffer_offset;
context->pipe_data.cb3_swvp.buffer_size = cb.buffer_size;
context->pipe_data.cb3_swvp.user_buffer = cb.user_buffer;
context->changed.vs_const_b = 0;
}
if (!device->driver_caps.user_cbufs) {
struct pipe_constant_buffer *cb = &(context->pipe_data.cb0_swvp);
u_upload_data(device->constbuf_uploader,
0,
cb->buffer_size,
device->constbuf_alignment,
cb->user_buffer,
&(cb->buffer_offset),
&(cb->buffer));
u_upload_unmap(device->constbuf_uploader);
cb->user_buffer = NULL;
cb = &(context->pipe_data.cb1_swvp);
u_upload_data(device->constbuf_uploader,
0,
cb->buffer_size,
device->constbuf_alignment,
cb->user_buffer,
&(cb->buffer_offset),
&(cb->buffer));
u_upload_unmap(device->constbuf_uploader);
cb->user_buffer = NULL;
cb = &(context->pipe_data.cb2_swvp);
u_upload_data(device->constbuf_uploader,
0,
cb->buffer_size,
device->constbuf_alignment,
cb->user_buffer,
&(cb->buffer_offset),
&(cb->buffer));
u_upload_unmap(device->constbuf_uploader);
cb->user_buffer = NULL;
cb = &(context->pipe_data.cb3_swvp);
u_upload_data(device->constbuf_uploader,
0,
cb->buffer_size,
device->constbuf_alignment,
cb->user_buffer,
&(cb->buffer_offset),
&(cb->buffer));
u_upload_unmap(device->constbuf_uploader);
cb->user_buffer = NULL;
}
context->changed.group &= ~NINE_STATE_VS_CONST;
context->commit |= NINE_STATE_COMMIT_CONST_VS;
}
static void
prepare_vs_constants_userbuf(struct NineDevice9 *device)
{
struct nine_context *context = &device->context;
struct pipe_constant_buffer cb;
cb.buffer = NULL;
cb.buffer_offset = 0;
cb.buffer_size = context->vs->const_used_size;
cb.user_buffer = context->vs_const_f;
if (device->swvp) {
prepare_vs_constants_userbuf_swvp(device);
return;
}
if (context->changed.vs_const_i || context->changed.group & NINE_STATE_SWVP) {
int *idst = (int *)&context->vs_const_f[4 * device->max_vs_const_f];
memcpy(idst, context->vs_const_i, NINE_MAX_CONST_I * sizeof(int[4]));
context->changed.vs_const_i = 0;
}
if (context->changed.vs_const_b || context->changed.group & NINE_STATE_SWVP) {
int *idst = (int *)&context->vs_const_f[4 * device->max_vs_const_f];
uint32_t *bdst = (uint32_t *)&idst[4 * NINE_MAX_CONST_I];
memcpy(bdst, context->vs_const_b, NINE_MAX_CONST_B * sizeof(BOOL));
context->changed.vs_const_b = 0;
}
if (!cb.buffer_size)
return;
if (context->vs->lconstf.ranges) {
/* TODO: Can we make it so that we don't have to copy everything ? */
const struct nine_lconstf *lconstf = &(context->vs->lconstf);
const struct nine_range *r = lconstf->ranges;
unsigned n = 0;
float *dst = context->vs_lconstf_temp;
float *src = (float *)cb.user_buffer;
memcpy(dst, src, cb.buffer_size);
while (r) {
unsigned p = r->bgn;
unsigned c = r->end - r->bgn;
memcpy(&dst[p * 4], &lconstf->data[n * 4], c * 4 * sizeof(float));
n += c;
r = r->next;
}
cb.user_buffer = dst;
}
if (!device->driver_caps.user_cbufs) {
context->pipe_data.cb_vs.buffer_size = cb.buffer_size;
u_upload_data(device->constbuf_uploader,
0,
cb.buffer_size,
device->constbuf_alignment,
cb.user_buffer,
&context->pipe_data.cb_vs.buffer_offset,
&context->pipe_data.cb_vs.buffer);
u_upload_unmap(device->constbuf_uploader);
context->pipe_data.cb_vs.user_buffer = NULL;
} else
context->pipe_data.cb_vs = cb;
context->changed.vs_const_f = 0;
context->changed.group &= ~NINE_STATE_VS_CONST;
context->commit |= NINE_STATE_COMMIT_CONST_VS;
}
static void
prepare_ps_constants_userbuf(struct NineDevice9 *device)
{
struct nine_context *context = &device->context;
struct pipe_constant_buffer cb;
cb.buffer = NULL;
cb.buffer_offset = 0;
cb.buffer_size = context->ps->const_used_size;
cb.user_buffer = context->ps_const_f;
if (context->changed.ps_const_i) {
int *idst = (int *)&context->ps_const_f[4 * device->max_ps_const_f];
memcpy(idst, context->ps_const_i, sizeof(context->ps_const_i));
context->changed.ps_const_i = 0;
}
if (context->changed.ps_const_b) {
int *idst = (int *)&context->ps_const_f[4 * device->max_ps_const_f];
uint32_t *bdst = (uint32_t *)&idst[4 * NINE_MAX_CONST_I];
memcpy(bdst, context->ps_const_b, sizeof(context->ps_const_b));
context->changed.ps_const_b = 0;
}
/* Upload special constants needed to implement PS1.x instructions like TEXBEM,TEXBEML and BEM */
if (context->ps->bumpenvmat_needed) {
memcpy(context->ps_lconstf_temp, cb.user_buffer, cb.buffer_size);
memcpy(&context->ps_lconstf_temp[4 * 8], &device->context.bumpmap_vars, sizeof(device->context.bumpmap_vars));
cb.user_buffer = context->ps_lconstf_temp;
}
if (context->ps->byte_code.version < 0x30 &&
context->rs[D3DRS_FOGENABLE]) {
float *dst = &context->ps_lconstf_temp[4 * 32];
if (cb.user_buffer != context->ps_lconstf_temp) {
memcpy(context->ps_lconstf_temp, cb.user_buffer, cb.buffer_size);
cb.user_buffer = context->ps_lconstf_temp;
}
d3dcolor_to_rgba(dst, context->rs[D3DRS_FOGCOLOR]);
if (context->rs[D3DRS_FOGTABLEMODE] == D3DFOG_LINEAR) {
dst[4] = asfloat(context->rs[D3DRS_FOGEND]);
dst[5] = 1.0f / (asfloat(context->rs[D3DRS_FOGEND]) - asfloat(context->rs[D3DRS_FOGSTART]));
} else if (context->rs[D3DRS_FOGTABLEMODE] != D3DFOG_NONE) {
dst[4] = asfloat(context->rs[D3DRS_FOGDENSITY]);
}
cb.buffer_size = 4 * 4 * 34;
}
if (!cb.buffer_size)
return;
if (!device->driver_caps.user_cbufs) {
context->pipe_data.cb_ps.buffer_size = cb.buffer_size;
u_upload_data(device->constbuf_uploader,
0,
cb.buffer_size,
device->constbuf_alignment,
cb.user_buffer,
&context->pipe_data.cb_ps.buffer_offset,
&context->pipe_data.cb_ps.buffer);
u_upload_unmap(device->constbuf_uploader);
context->pipe_data.cb_ps.user_buffer = NULL;
} else
context->pipe_data.cb_ps = cb;
context->changed.ps_const_f = 0;
context->changed.group &= ~NINE_STATE_PS_CONST;
context->commit |= NINE_STATE_COMMIT_CONST_PS;
}
static inline uint32_t
prepare_vs(struct NineDevice9 *device, uint8_t shader_changed)
{
struct nine_context *context = &device->context;
struct NineVertexShader9 *vs = context->vs;
uint32_t changed_group = 0;
int has_key_changed = 0;
if (likely(context->programmable_vs))
has_key_changed = NineVertexShader9_UpdateKey(vs, device);
if (!shader_changed && !has_key_changed)
return 0;
/* likely because we dislike FF */
if (likely(context->programmable_vs)) {
context->cso_shader.vs = NineVertexShader9_GetVariant(vs);
} else {
vs = device->ff.vs;
context->cso_shader.vs = vs->ff_cso;
}
if (context->rs[NINED3DRS_VSPOINTSIZE] != vs->point_size) {
context->rs[NINED3DRS_VSPOINTSIZE] = vs->point_size;
changed_group |= NINE_STATE_RASTERIZER;
}
if ((context->bound_samplers_mask_vs & vs->sampler_mask) != vs->sampler_mask)
/* Bound dummy sampler. */
changed_group |= NINE_STATE_SAMPLER;
context->commit |= NINE_STATE_COMMIT_VS;
return changed_group;
}
static inline uint32_t
prepare_ps(struct NineDevice9 *device, uint8_t shader_changed)
{
struct nine_context *context = &device->context;
struct NinePixelShader9 *ps = context->ps;
uint32_t changed_group = 0;
int has_key_changed = 0;
if (likely(ps))
has_key_changed = NinePixelShader9_UpdateKey(ps, context);
if (!shader_changed && !has_key_changed)
return 0;
if (likely(ps)) {
context->cso_shader.ps = NinePixelShader9_GetVariant(ps);
} else {
ps = device->ff.ps;
context->cso_shader.ps = ps->ff_cso;
}
if ((context->bound_samplers_mask_ps & ps->sampler_mask) != ps->sampler_mask)
/* Bound dummy sampler. */
changed_group |= NINE_STATE_SAMPLER;
context->commit |= NINE_STATE_COMMIT_PS;
return changed_group;
}
/* State preparation incremental */
/* State preparation + State commit */
static void
update_framebuffer(struct NineDevice9 *device, bool is_clear)
{
struct pipe_context *pipe = device->pipe;
struct nine_context *context = &device->context;
struct pipe_framebuffer_state *fb = &context->pipe_data.fb;
unsigned i;
struct NineSurface9 *rt0 = context->rt[0];
unsigned w = rt0->desc.Width;
unsigned h = rt0->desc.Height;
unsigned nr_samples = rt0->base.info.nr_samples;
unsigned ps_mask = context->ps ? context->ps->rt_mask : 1;
unsigned mask = is_clear ? 0xf : ps_mask;
const int sRGB = context->rs[D3DRS_SRGBWRITEENABLE] ? 1 : 0;
DBG("\n");
context->rt_mask = 0x0;
fb->nr_cbufs = 0;
/* all render targets must have the same size and the depth buffer must be
* bigger. Multisample has to match, according to spec. But some apps do
* things wrong there, and no error is returned. The behaviour they get
* apparently is that depth buffer is disabled if it doesn't match.
* Surely the same for render targets. */
/* Special case: D3DFMT_NULL is used to bound no real render target,
* but render to depth buffer. We have to not take into account the render
* target info. TODO: know what should happen when there are several render targers
* and the first one is D3DFMT_NULL */
if (rt0->desc.Format == D3DFMT_NULL && context->ds) {
w = context->ds->desc.Width;
h = context->ds->desc.Height;
nr_samples = context->ds->base.info.nr_samples;
}
for (i = 0; i < device->caps.NumSimultaneousRTs; ++i) {
struct NineSurface9 *rt = context->rt[i];
if (rt && rt->desc.Format != D3DFMT_NULL && (mask & (1 << i)) &&
rt->desc.Width == w && rt->desc.Height == h &&
rt->base.info.nr_samples == nr_samples) {
fb->cbufs[i] = NineSurface9_GetSurface(rt, sRGB);
context->rt_mask |= 1 << i;
fb->nr_cbufs = i + 1;
if (unlikely(rt->desc.Usage & D3DUSAGE_AUTOGENMIPMAP)) {
assert(rt->texture == D3DRTYPE_TEXTURE ||
rt->texture == D3DRTYPE_CUBETEXTURE);
NineBaseTexture9(rt->base.base.container)->dirty_mip = TRUE;
}
} else {
/* Color outputs must match RT slot,
* drivers will have to handle NULL entries for GL, too.
*/
fb->cbufs[i] = NULL;
}
}
if (context->ds && context->ds->desc.Width >= w &&
context->ds->desc.Height >= h &&
context->ds->base.info.nr_samples == nr_samples) {
fb->zsbuf = NineSurface9_GetSurface(context->ds, 0);
} else {
fb->zsbuf = NULL;
}
fb->width = w;
fb->height = h;
pipe->set_framebuffer_state(pipe, fb); /* XXX: cso ? */
if (is_clear && context->rt_mask == ps_mask)
context->changed.group &= ~NINE_STATE_FB;
}
static void
update_viewport(struct NineDevice9 *device)
{
const D3DVIEWPORT9 *vport = &device->context.viewport;
struct pipe_viewport_state pvport;
/* D3D coordinates are:
* -1 .. +1 for X,Y and
* 0 .. +1 for Z (we use pipe_rasterizer_state.clip_halfz)
*/
pvport.scale[0] = (float)vport->Width * 0.5f;
pvport.scale[1] = (float)vport->Height * -0.5f;
pvport.scale[2] = vport->MaxZ - vport->MinZ;
pvport.translate[0] = (float)vport->Width * 0.5f + (float)vport->X;
pvport.translate[1] = (float)vport->Height * 0.5f + (float)vport->Y;
pvport.translate[2] = vport->MinZ;
/* We found R600 and SI cards have some imprecision
* on the barycentric coordinates used for interpolation.
* Some shaders rely on having something precise.
* We found that the proprietary driver has the imprecision issue,
* except when the render target width and height are powers of two.
* It is using some sort of workaround for these cases
* which covers likely all the cases the applications rely
* on something precise.
* We haven't found the workaround, but it seems like it's better
* for applications if the imprecision is biased towards infinity
* instead of -infinity (which is what measured). So shift slightly
* the viewport: not enough to change rasterization result (in particular
* for multisampling), but enough to make the imprecision biased
* towards infinity. We do this shift only if render target width and
* height are powers of two.
* Solves 'red shadows' bug on UE3 games.
*/
if (device->driver_bugs.buggy_barycentrics &&
((vport->Width & (vport->Width-1)) == 0) &&
((vport->Height & (vport->Height-1)) == 0)) {
pvport.translate[0] -= 1.0f / 128.0f;
pvport.translate[1] -= 1.0f / 128.0f;
}
cso_set_viewport(device->cso, &pvport);
}
/* Loop through VS inputs and pick the vertex elements with the declared
* usage from the vertex declaration, then insert the instance divisor from
* the stream source frequency setting.
*/
static void
update_vertex_elements(struct NineDevice9 *device)
{
struct nine_context *context = &device->context;
const struct NineVertexDeclaration9 *vdecl = device->context.vdecl;
const struct NineVertexShader9 *vs;
unsigned n, b, i;
int index;
char vdecl_index_map[16]; /* vs->num_inputs <= 16 */
char used_streams[device->caps.MaxStreams];
int dummy_vbo_stream = -1;
BOOL need_dummy_vbo = FALSE;
struct pipe_vertex_element ve[PIPE_MAX_ATTRIBS];
context->stream_usage_mask = 0;
memset(vdecl_index_map, -1, 16);
memset(used_streams, 0, device->caps.MaxStreams);
vs = context->programmable_vs ? context->vs : device->ff.vs;
if (vdecl) {
for (n = 0; n < vs->num_inputs; ++n) {
DBG("looking up input %u (usage %u) from vdecl(%p)\n",
n, vs->input_map[n].ndecl, vdecl);
for (i = 0; i < vdecl->nelems; i++) {
if (vdecl->usage_map[i] == vs->input_map[n].ndecl) {
vdecl_index_map[n] = i;
used_streams[vdecl->elems[i].vertex_buffer_index] = 1;
break;
}
}
if (vdecl_index_map[n] < 0)
need_dummy_vbo = TRUE;
}
} else {
/* No vertex declaration. Likely will never happen in practice,
* but we need not crash on this */
need_dummy_vbo = TRUE;
}
if (need_dummy_vbo) {
for (i = 0; i < device->caps.MaxStreams; i++ ) {
if (!used_streams[i]) {
dummy_vbo_stream = i;
break;
}
}
}
/* there are less vertex shader inputs than stream slots,
* so if we need a slot for the dummy vbo, we should have found one */
assert (!need_dummy_vbo || dummy_vbo_stream != -1);
for (n = 0; n < vs->num_inputs; ++n) {
index = vdecl_index_map[n];
if (index >= 0) {
ve[n] = vdecl->elems[index];
b = ve[n].vertex_buffer_index;
context->stream_usage_mask |= 1 << b;
/* XXX wine just uses 1 here: */
if (context->stream_freq[b] & D3DSTREAMSOURCE_INSTANCEDATA)
ve[n].instance_divisor = context->stream_freq[b] & 0x7FFFFF;
} else {
/* if the vertex declaration is incomplete compared to what the
* vertex shader needs, we bind a dummy vbo with 0 0 0 0.
* This is not precised by the spec, but is the behaviour
* tested on win */
ve[n].vertex_buffer_index = dummy_vbo_stream;
ve[n].src_format = PIPE_FORMAT_R32G32B32A32_FLOAT;
ve[n].src_offset = 0;
ve[n].instance_divisor = 0;
}
}
if (context->dummy_vbo_bound_at != dummy_vbo_stream) {
if (context->dummy_vbo_bound_at >= 0)
context->changed.vtxbuf |= 1 << context->dummy_vbo_bound_at;
if (dummy_vbo_stream >= 0) {
context->changed.vtxbuf |= 1 << dummy_vbo_stream;
context->vbo_bound_done = FALSE;
}
context->dummy_vbo_bound_at = dummy_vbo_stream;
}
cso_set_vertex_elements(device->cso, vs->num_inputs, ve);
}
static void
update_vertex_buffers(struct NineDevice9 *device)
{
struct pipe_context *pipe = device->pipe;
struct nine_context *context = &device->context;
struct pipe_vertex_buffer dummy_vtxbuf;
uint32_t mask = context->changed.vtxbuf;
unsigned i;
DBG("mask=%x\n", mask);
if (context->dummy_vbo_bound_at >= 0) {
if (!context->vbo_bound_done) {
dummy_vtxbuf.buffer = device->dummy_vbo;
dummy_vtxbuf.stride = 0;
dummy_vtxbuf.user_buffer = NULL;
dummy_vtxbuf.buffer_offset = 0;
pipe->set_vertex_buffers(pipe, context->dummy_vbo_bound_at,
1, &dummy_vtxbuf);
context->vbo_bound_done = TRUE;
}
mask &= ~(1 << context->dummy_vbo_bound_at);
}
for (i = 0; mask; mask >>= 1, ++i) {
if (mask & 1) {
if (context->vtxbuf[i].buffer)
pipe->set_vertex_buffers(pipe, i, 1, &context->vtxbuf[i]);
else
pipe->set_vertex_buffers(pipe, i, 1, NULL);
}
}
context->changed.vtxbuf = 0;
}
static inline boolean
update_sampler_derived(struct nine_context *context, unsigned s)
{
boolean changed = FALSE;
if (context->samp[s][NINED3DSAMP_SHADOW] != context->texture[s]->shadow) {
changed = TRUE;
context->samp[s][NINED3DSAMP_SHADOW] = context->texture[s]->shadow;
}
if (context->samp[s][NINED3DSAMP_CUBETEX] !=
(NineResource9(context->texture[s])->type == D3DRTYPE_CUBETEXTURE)) {
changed = TRUE;
context->samp[s][NINED3DSAMP_CUBETEX] =
NineResource9(context->texture[s])->type == D3DRTYPE_CUBETEXTURE;
}
if (context->samp[s][D3DSAMP_MIPFILTER] != D3DTEXF_NONE) {
int lod = context->samp[s][D3DSAMP_MAXMIPLEVEL] - context->texture[s]->managed.lod;
if (lod < 0)
lod = 0;
if (context->samp[s][NINED3DSAMP_MINLOD] != lod) {
changed = TRUE;
context->samp[s][NINED3DSAMP_MINLOD] = lod;
}
} else {
context->changed.sampler[s] &= ~0x300; /* lod changes irrelevant */
}
return changed;
}
/* TODO: add sRGB override to pipe_sampler_state ? */
static void
update_textures_and_samplers(struct NineDevice9 *device)
{
struct nine_context *context = &device->context;
struct pipe_sampler_view *view[NINE_MAX_SAMPLERS];
unsigned num_textures;
unsigned i;
boolean commit_samplers;
uint16_t sampler_mask = context->ps ? context->ps->sampler_mask :
device->ff.ps->sampler_mask;
/* TODO: Can we reduce iterations here ? */
commit_samplers = FALSE;
context->bound_samplers_mask_ps = 0;
for (num_textures = 0, i = 0; i < NINE_MAX_SAMPLERS_PS; ++i) {
const unsigned s = NINE_SAMPLER_PS(i);
int sRGB;
if (!context->texture[s] && !(sampler_mask & (1 << i))) {
view[i] = NULL;
continue;
}
if (context->texture[s]) {
sRGB = context->samp[s][D3DSAMP_SRGBTEXTURE] ? 1 : 0;
view[i] = NineBaseTexture9_GetSamplerView(context->texture[s], sRGB);
num_textures = i + 1;
if (update_sampler_derived(context, s) || (context->changed.sampler[s] & 0x05fe)) {
context->changed.sampler[s] = 0;
commit_samplers = TRUE;
nine_convert_sampler_state(device->cso, s, context->samp[s]);
}
} else {
/* Bind dummy sampler. We do not bind dummy sampler when
* it is not needed because it could add overhead. The
* dummy sampler should have r=g=b=0 and a=1. We do not
* unbind dummy sampler directly when they are not needed
* anymore, but they're going to be removed as long as texture
* or sampler states are changed. */
view[i] = device->dummy_sampler_view;
num_textures = i + 1;
cso_single_sampler(device->cso, PIPE_SHADER_FRAGMENT,
s - NINE_SAMPLER_PS(0), &device->dummy_sampler_state);
commit_samplers = TRUE;
context->changed.sampler[s] = ~0;
}
context->bound_samplers_mask_ps |= (1 << s);
}
cso_set_sampler_views(device->cso, PIPE_SHADER_FRAGMENT, num_textures, view);
if (commit_samplers)
cso_single_sampler_done(device->cso, PIPE_SHADER_FRAGMENT);
commit_samplers = FALSE;
sampler_mask = context->programmable_vs ? context->vs->sampler_mask : 0;
context->bound_samplers_mask_vs = 0;
for (num_textures = 0, i = 0; i < NINE_MAX_SAMPLERS_VS; ++i) {
const unsigned s = NINE_SAMPLER_VS(i);
int sRGB;
if (!context->texture[s] && !(sampler_mask & (1 << i))) {
view[i] = NULL;
continue;
}
if (context->texture[s]) {
sRGB = context->samp[s][D3DSAMP_SRGBTEXTURE] ? 1 : 0;
view[i] = NineBaseTexture9_GetSamplerView(context->texture[s], sRGB);
num_textures = i + 1;
if (update_sampler_derived(context, s) || (context->changed.sampler[s] & 0x05fe)) {
context->changed.sampler[s] = 0;
commit_samplers = TRUE;
nine_convert_sampler_state(device->cso, s, context->samp[s]);
}
} else {
/* Bind dummy sampler. We do not bind dummy sampler when
* it is not needed because it could add overhead. The
* dummy sampler should have r=g=b=0 and a=1. We do not
* unbind dummy sampler directly when they are not needed
* anymore, but they're going to be removed as long as texture
* or sampler states are changed. */
view[i] = device->dummy_sampler_view;
num_textures = i + 1;
cso_single_sampler(device->cso, PIPE_SHADER_VERTEX,
s - NINE_SAMPLER_VS(0), &device->dummy_sampler_state);
commit_samplers = TRUE;
context->changed.sampler[s] = ~0;
}
context->bound_samplers_mask_vs |= (1 << s);
}
cso_set_sampler_views(device->cso, PIPE_SHADER_VERTEX, num_textures, view);
if (commit_samplers)
cso_single_sampler_done(device->cso, PIPE_SHADER_VERTEX);
}
/* State commit only */
static inline void
commit_blend(struct NineDevice9 *device)
{
cso_set_blend(device->cso, &device->context.pipe_data.blend);
}
static inline void
commit_dsa(struct NineDevice9 *device)
{
cso_set_depth_stencil_alpha(device->cso, &device->context.pipe_data.dsa);
}
static inline void
commit_scissor(struct NineDevice9 *device)
{
struct pipe_context *pipe = device->pipe;
pipe->set_scissor_states(pipe, 0, 1, &device->context.scissor);
}
static inline void
commit_rasterizer(struct NineDevice9 *device)
{
cso_set_rasterizer(device->cso, &device->context.pipe_data.rast);
}
static inline void
commit_index_buffer(struct NineDevice9 *device)
{
struct pipe_context *pipe = device->pipe;
if (device->context.idxbuf.buffer)
pipe->set_index_buffer(pipe, &device->context.idxbuf);
else
pipe->set_index_buffer(pipe, NULL);
}
static inline void
commit_vs_constants(struct NineDevice9 *device)
{
struct pipe_context *pipe = device->pipe;
if (unlikely(!device->context.programmable_vs))
pipe->set_constant_buffer(pipe, PIPE_SHADER_VERTEX, 0, &device->context.pipe_data.cb_vs_ff);
else {
if (device->swvp) {
pipe->set_constant_buffer(pipe, PIPE_SHADER_VERTEX, 0, &device->context.pipe_data.cb0_swvp);
pipe->set_constant_buffer(pipe, PIPE_SHADER_VERTEX, 1, &device->context.pipe_data.cb1_swvp);
pipe->set_constant_buffer(pipe, PIPE_SHADER_VERTEX, 2, &device->context.pipe_data.cb2_swvp);
pipe->set_constant_buffer(pipe, PIPE_SHADER_VERTEX, 3, &device->context.pipe_data.cb3_swvp);
} else {
pipe->set_constant_buffer(pipe, PIPE_SHADER_VERTEX, 0, &device->context.pipe_data.cb_vs);
}
}
}
static inline void
commit_ps_constants(struct NineDevice9 *device)
{
struct pipe_context *pipe = device->pipe;
if (unlikely(!device->context.ps))
pipe->set_constant_buffer(pipe, PIPE_SHADER_FRAGMENT, 0, &device->context.pipe_data.cb_ps_ff);
else
pipe->set_constant_buffer(pipe, PIPE_SHADER_FRAGMENT, 0, &device->context.pipe_data.cb_ps);
}
static inline void
commit_vs(struct NineDevice9 *device)
{
struct nine_context *context = &device->context;
device->pipe->bind_vs_state(device->pipe, context->cso_shader.vs);
}
static inline void
commit_ps(struct NineDevice9 *device)
{
struct nine_context *context = &device->context;
device->pipe->bind_fs_state(device->pipe, context->cso_shader.ps);
}
/* State Update */
#define NINE_STATE_SHADER_CHANGE_VS \
(NINE_STATE_VS | \
NINE_STATE_TEXTURE | \
NINE_STATE_FOG_SHADER | \
NINE_STATE_POINTSIZE_SHADER | \
NINE_STATE_SWVP)
#define NINE_STATE_SHADER_CHANGE_PS \
(NINE_STATE_PS | \
NINE_STATE_TEXTURE | \
NINE_STATE_FOG_SHADER | \
NINE_STATE_PS1X_SHADER)
#define NINE_STATE_FREQUENT \
(NINE_STATE_RASTERIZER | \
NINE_STATE_TEXTURE | \
NINE_STATE_SAMPLER | \
NINE_STATE_VS_CONST | \
NINE_STATE_PS_CONST | \
NINE_STATE_MULTISAMPLE)
#define NINE_STATE_COMMON \
(NINE_STATE_FB | \
NINE_STATE_BLEND | \
NINE_STATE_DSA | \
NINE_STATE_VIEWPORT | \
NINE_STATE_VDECL | \
NINE_STATE_IDXBUF | \
NINE_STATE_STREAMFREQ)
#define NINE_STATE_RARE \
(NINE_STATE_SCISSOR | \
NINE_STATE_BLEND_COLOR | \
NINE_STATE_STENCIL_REF | \
NINE_STATE_SAMPLE_MASK)
/* TODO: only go through dirty textures */
static void
validate_textures(struct NineDevice9 *device)
{
struct NineBaseTexture9 *tex, *ptr;
LIST_FOR_EACH_ENTRY_SAFE(tex, ptr, &device->update_textures, list) {
list_delinit(&tex->list);
NineBaseTexture9_Validate(tex);
}
}
static void
update_managed_buffers(struct NineDevice9 *device)
{
struct NineBuffer9 *buf, *ptr;
LIST_FOR_EACH_ENTRY_SAFE(buf, ptr, &device->update_buffers, managed.list) {
list_delinit(&buf->managed.list);
NineBuffer9_Upload(buf);
}
}
static void
nine_update_state(struct NineDevice9 *device)
{
struct pipe_context *pipe = device->pipe;
struct nine_context *context = &device->context;
uint32_t group;
DBG("changed state groups: %x\n", context->changed.group);
/* NOTE: We may want to use the cso cache for everything, or let
* NineDevice9.RestoreNonCSOState actually set the states, then we wouldn't
* have to care about state being clobbered here and could merge this back
* into update_textures. Except, we also need to re-validate textures that
* may be dirty anyway, even if no texture bindings changed.
*/
validate_textures(device); /* may clobber state */
update_managed_buffers(device);
/* ff_update may change VS/PS dirty bits */
if (unlikely(!context->programmable_vs || !context->ps))
nine_ff_update(device);
group = context->changed.group;
if (group & (NINE_STATE_SHADER_CHANGE_VS | NINE_STATE_SHADER_CHANGE_PS)) {
if (group & NINE_STATE_SHADER_CHANGE_VS)
group |= prepare_vs(device, (group & NINE_STATE_VS) != 0); /* may set NINE_STATE_RASTERIZER and NINE_STATE_SAMPLER*/
if (group & NINE_STATE_SHADER_CHANGE_PS)
group |= prepare_ps(device, (group & NINE_STATE_PS) != 0);
}
if (group & (NINE_STATE_COMMON | NINE_STATE_VS)) {
if (group & NINE_STATE_FB)
update_framebuffer(device, FALSE);
if (group & NINE_STATE_BLEND)
prepare_blend(device);
if (group & NINE_STATE_DSA)
prepare_dsa(device);
if (group & NINE_STATE_VIEWPORT)
update_viewport(device);
if (group & (NINE_STATE_VDECL | NINE_STATE_VS | NINE_STATE_STREAMFREQ))
update_vertex_elements(device);
if (group & NINE_STATE_IDXBUF)
commit_index_buffer(device);
}
if (likely(group & (NINE_STATE_FREQUENT | NINE_STATE_VS | NINE_STATE_PS | NINE_STATE_SWVP))) {
if (group & NINE_STATE_MULTISAMPLE)
group |= check_multisample(device);
if (group & NINE_STATE_RASTERIZER)
prepare_rasterizer(device);
if (group & (NINE_STATE_TEXTURE | NINE_STATE_SAMPLER))
update_textures_and_samplers(device);
if ((group & (NINE_STATE_VS_CONST | NINE_STATE_VS | NINE_STATE_SWVP)) && context->programmable_vs)
prepare_vs_constants_userbuf(device);
if ((group & (NINE_STATE_PS_CONST | NINE_STATE_PS)) && context->ps)
prepare_ps_constants_userbuf(device);
}
if (context->changed.vtxbuf)
update_vertex_buffers(device);
if (context->commit & NINE_STATE_COMMIT_BLEND)
commit_blend(device);
if (context->commit & NINE_STATE_COMMIT_DSA)
commit_dsa(device);
if (context->commit & NINE_STATE_COMMIT_RASTERIZER)
commit_rasterizer(device);
if (context->commit & NINE_STATE_COMMIT_CONST_VS)
commit_vs_constants(device);
if (context->commit & NINE_STATE_COMMIT_CONST_PS)
commit_ps_constants(device);
if (context->commit & NINE_STATE_COMMIT_VS)
commit_vs(device);
if (context->commit & NINE_STATE_COMMIT_PS)
commit_ps(device);
context->commit = 0;
if (unlikely(context->changed.ucp)) {
pipe->set_clip_state(pipe, &context->clip);
context->changed.ucp = FALSE;
}
if (unlikely(group & NINE_STATE_RARE)) {
if (group & NINE_STATE_SCISSOR)
commit_scissor(device);
if (group & NINE_STATE_BLEND_COLOR) {
struct pipe_blend_color color;
d3dcolor_to_rgba(&color.color[0], context->rs[D3DRS_BLENDFACTOR]);
pipe->set_blend_color(pipe, &color);
}
if (group & NINE_STATE_SAMPLE_MASK) {
if (context->rt[0]->desc.MultiSampleType <= D3DMULTISAMPLE_NONMASKABLE) {
pipe->set_sample_mask(pipe, ~0);
} else {
pipe->set_sample_mask(pipe, context->rs[D3DRS_MULTISAMPLEMASK]);
}
}
if (group & NINE_STATE_STENCIL_REF) {
struct pipe_stencil_ref ref;
ref.ref_value[0] = context->rs[D3DRS_STENCILREF];
ref.ref_value[1] = ref.ref_value[0];
pipe->set_stencil_ref(pipe, &ref);
}
}
context->changed.group &=
(NINE_STATE_FF | NINE_STATE_VS_CONST | NINE_STATE_PS_CONST);
DBG("finished\n");
}
#define RESZ_CODE 0x7fa05000
static void
NineDevice9_ResolveZ( struct NineDevice9 *device )
{
struct nine_context *context = &device->context;
const struct util_format_description *desc;
struct NineSurface9 *source = context->ds;
struct NineBaseTexture9 *destination = context->texture[0];
struct pipe_resource *src, *dst;
struct pipe_blit_info blit;
DBG("RESZ resolve\n");
if (!source || !destination ||
destination->base.type != D3DRTYPE_TEXTURE)
return;
src = source->base.resource;
dst = destination->base.resource;
if (!src || !dst)
return;
/* check dst is depth format. we know already for src */
desc = util_format_description(dst->format);
if (desc->colorspace != UTIL_FORMAT_COLORSPACE_ZS)
return;
memset(&blit, 0, sizeof(blit));
blit.src.resource = src;
blit.src.level = 0;
blit.src.format = src->format;
blit.src.box.z = 0;
blit.src.box.depth = 1;
blit.src.box.x = 0;
blit.src.box.y = 0;
blit.src.box.width = src->width0;
blit.src.box.height = src->height0;
blit.dst.resource = dst;
blit.dst.level = 0;
blit.dst.format = dst->format;
blit.dst.box.z = 0;
blit.dst.box.depth = 1;
blit.dst.box.x = 0;
blit.dst.box.y = 0;
blit.dst.box.width = dst->width0;
blit.dst.box.height = dst->height0;
blit.mask = PIPE_MASK_ZS;
blit.filter = PIPE_TEX_FILTER_NEAREST;
blit.scissor_enable = FALSE;
device->pipe->blit(device->pipe, &blit);
}
#define ALPHA_TO_COVERAGE_ENABLE MAKEFOURCC('A', '2', 'M', '1')
#define ALPHA_TO_COVERAGE_DISABLE MAKEFOURCC('A', '2', 'M', '0')
void
nine_context_set_render_state(struct NineDevice9 *device,
D3DRENDERSTATETYPE State,
DWORD Value)
{
struct nine_context *context = &device->context;
/* Amd hacks (equivalent to GL extensions) */
if (unlikely(State == D3DRS_POINTSIZE)) {
if (Value == RESZ_CODE) {
NineDevice9_ResolveZ(device);
return;
}
if (Value == ALPHA_TO_COVERAGE_ENABLE ||
Value == ALPHA_TO_COVERAGE_DISABLE) {
context->rs[NINED3DRS_ALPHACOVERAGE] = (Value == ALPHA_TO_COVERAGE_ENABLE);
context->changed.group |= NINE_STATE_BLEND;
return;
}
}
/* NV hack */
if (unlikely(State == D3DRS_ADAPTIVETESS_Y)) {
if (Value == D3DFMT_ATOC || (Value == D3DFMT_UNKNOWN && context->rs[NINED3DRS_ALPHACOVERAGE])) {
context->rs[NINED3DRS_ALPHACOVERAGE] = (Value == D3DFMT_ATOC) ? 3 : 0;
context->rs[NINED3DRS_ALPHACOVERAGE] &= context->rs[D3DRS_ALPHATESTENABLE] ? 3 : 2;
context->changed.group |= NINE_STATE_BLEND;
return;
}
}
if (unlikely(State == D3DRS_ALPHATESTENABLE && (context->rs[NINED3DRS_ALPHACOVERAGE] & 2))) {
DWORD alphacoverage_prev = context->rs[NINED3DRS_ALPHACOVERAGE];
context->rs[NINED3DRS_ALPHACOVERAGE] = (Value ? 3 : 2);
if (context->rs[NINED3DRS_ALPHACOVERAGE] != alphacoverage_prev)
context->changed.group |= NINE_STATE_BLEND;
}
context->rs[State] = nine_fix_render_state_value(State, Value);
context->changed.group |= nine_render_state_group[State];
}
void
nine_context_set_texture(struct NineDevice9 *device,
DWORD Stage,
struct NineBaseTexture9 *tex)
{
struct nine_context *context = &device->context;
context->samplers_shadow &= ~(1 << Stage);
if (tex)
context->samplers_shadow |= tex->shadow << Stage;
nine_bind(&context->texture[Stage], tex);
context->changed.group |= NINE_STATE_TEXTURE;
}
void
nine_context_set_sampler_state(struct NineDevice9 *device,
DWORD Sampler,
D3DSAMPLERSTATETYPE Type,
DWORD Value)
{
struct nine_context *context = &device->context;
if (unlikely(!nine_check_sampler_state_value(Type, Value)))
return;
context->samp[Sampler][Type] = Value;
context->changed.group |= NINE_STATE_SAMPLER;
context->changed.sampler[Sampler] |= 1 << Type;
}
void
nine_context_set_stream_source(struct NineDevice9 *device,
UINT StreamNumber,
struct NineVertexBuffer9 *pVBuf9,
UINT OffsetInBytes,
UINT Stride)
{
struct nine_context *context = &device->context;
const unsigned i = StreamNumber;
context->changed.vtxbuf |= 1 << StreamNumber;
if (pVBuf9) {
context->vtxbuf[i].stride = Stride;
context->vtxbuf[i].buffer_offset = OffsetInBytes;
}
pipe_resource_reference(&context->vtxbuf[i].buffer,
pVBuf9 ? NineVertexBuffer9_GetResource(pVBuf9) : NULL);
}
void
nine_context_set_stream_source_freq(struct NineDevice9 *device,
UINT StreamNumber,
UINT Setting)
{
struct nine_context *context = &device->context;
context->stream_freq[StreamNumber] = Setting;
if (Setting & D3DSTREAMSOURCE_INSTANCEDATA)
context->stream_instancedata_mask |= 1 << StreamNumber;
else
context->stream_instancedata_mask &= ~(1 << StreamNumber);
if (StreamNumber != 0)
context->changed.group |= NINE_STATE_STREAMFREQ;
}
void
nine_context_set_indices(struct NineDevice9 *device,
struct NineIndexBuffer9 *idxbuf)
{
struct nine_context *context = &device->context;
const struct pipe_index_buffer *pipe_idxbuf;
if (idxbuf) {
pipe_idxbuf = NineIndexBuffer9_GetBuffer(idxbuf);
context->idxbuf.index_size = pipe_idxbuf->index_size;
pipe_resource_reference(&context->idxbuf.buffer, pipe_idxbuf->buffer);
context->idxbuf.offset = pipe_idxbuf->offset;
context->idxbuf.user_buffer = NULL;
} else
pipe_resource_reference(&context->idxbuf.buffer, NULL);
context->changed.group |= NINE_STATE_IDXBUF;
}
void
nine_context_set_vertex_declaration(struct NineDevice9 *device,
struct NineVertexDeclaration9 *vdecl)
{
struct nine_context *context = &device->context;
BOOL was_programmable_vs = context->programmable_vs;
nine_bind(&context->vdecl, vdecl);
context->programmable_vs = context->vs && !(context->vdecl && context->vdecl->position_t);
if (was_programmable_vs != context->programmable_vs) {
context->commit |= NINE_STATE_COMMIT_CONST_VS;
context->changed.group |= NINE_STATE_VS;
}
context->changed.group |= NINE_STATE_VDECL;
}
void
nine_context_set_vertex_shader(struct NineDevice9 *device,
struct NineVertexShader9 *pShader)
{
struct nine_context *context = &device->context;
BOOL was_programmable_vs = context->programmable_vs;
nine_bind(&context->vs, pShader);
context->programmable_vs = context->vs && !(context->vdecl && context->vdecl->position_t);
/* ff -> non-ff: commit back non-ff constants */
if (!was_programmable_vs && context->programmable_vs)
context->commit |= NINE_STATE_COMMIT_CONST_VS;
context->changed.group |= NINE_STATE_VS;
}
void
nine_context_set_vertex_shader_constant_f(struct NineDevice9 *device,
UINT StartRegister,
const float *pConstantData,
UINT Vector4fCount)
{
struct nine_context *context = &device->context;
float *vs_const_f = device->may_swvp ? context->vs_const_f_swvp : context->vs_const_f;
memcpy(&vs_const_f[StartRegister * 4],
pConstantData,
Vector4fCount * 4 * sizeof(context->vs_const_f[0]));
if (device->may_swvp) {
Vector4fCount = MIN2(StartRegister + Vector4fCount, NINE_MAX_CONST_F) - StartRegister;
if (StartRegister < NINE_MAX_CONST_F)
memcpy(&context->vs_const_f[StartRegister * 4],
pConstantData,
Vector4fCount * 4 * sizeof(context->vs_const_f[0]));
}
context->changed.vs_const_f = TRUE;
context->changed.group |= NINE_STATE_VS_CONST;
}
void
nine_context_set_vertex_shader_constant_i(struct NineDevice9 *device,
UINT StartRegister,
const int *pConstantData,
UINT Vector4iCount)
{
struct nine_context *context = &device->context;
int i;
if (device->driver_caps.vs_integer) {
memcpy(&context->vs_const_i[4 * StartRegister],
pConstantData,
Vector4iCount * sizeof(int[4]));
} else {
for (i = 0; i < Vector4iCount; i++) {
context->vs_const_i[4 * (StartRegister + i)] = fui((float)(pConstantData[4 * i]));
context->vs_const_i[4 * (StartRegister + i) + 1] = fui((float)(pConstantData[4 * i + 1]));
context->vs_const_i[4 * (StartRegister + i) + 2] = fui((float)(pConstantData[4 * i + 2]));
context->vs_const_i[4 * (StartRegister + i) + 3] = fui((float)(pConstantData[4 * i + 3]));
}
}
context->changed.vs_const_i = TRUE;
context->changed.group |= NINE_STATE_VS_CONST;
}
void
nine_context_set_vertex_shader_constant_b(struct NineDevice9 *device,
UINT StartRegister,
const BOOL *pConstantData,
UINT BoolCount)
{
struct nine_context *context = &device->context;
int i;
uint32_t bool_true = device->driver_caps.vs_integer ? 0xFFFFFFFF : fui(1.0f);
for (i = 0; i < BoolCount; i++)
context->vs_const_b[StartRegister + i] = pConstantData[i] ? bool_true : 0;
context->changed.vs_const_b = TRUE;
context->changed.group |= NINE_STATE_VS_CONST;
}
void
nine_context_set_pixel_shader(struct NineDevice9 *device,
struct NinePixelShader9* ps)
{
struct nine_context *context = &device->context;
unsigned old_mask = context->ps ? context->ps->rt_mask : 1;
unsigned mask;
/* ff -> non-ff: commit back non-ff constants */
if (!context->ps && ps)
context->commit |= NINE_STATE_COMMIT_CONST_PS;
nine_bind(&context->ps, ps);
context->changed.group |= NINE_STATE_PS;
mask = context->ps ? context->ps->rt_mask : 1;
/* We need to update cbufs if the pixel shader would
* write to different render targets */
if (mask != old_mask)
context->changed.group |= NINE_STATE_FB;
}
void
nine_context_set_pixel_shader_constant_f(struct NineDevice9 *device,
UINT StartRegister,
const float *pConstantData,
UINT Vector4fCount)
{
struct nine_context *context = &device->context;
memcpy(&context->ps_const_f[StartRegister * 4],
pConstantData,
Vector4fCount * 4 * sizeof(context->ps_const_f[0]));
context->changed.ps_const_f = TRUE;
context->changed.group |= NINE_STATE_PS_CONST;
}
void
nine_context_set_pixel_shader_constant_i(struct NineDevice9 *device,
UINT StartRegister,
const int *pConstantData,
UINT Vector4iCount)
{
struct nine_context *context = &device->context;
int i;
if (device->driver_caps.ps_integer) {
memcpy(&context->ps_const_i[StartRegister][0],
pConstantData,
Vector4iCount * sizeof(context->ps_const_i[0]));
} else {
for (i = 0; i < Vector4iCount; i++) {
context->ps_const_i[StartRegister+i][0] = fui((float)(pConstantData[4*i]));
context->ps_const_i[StartRegister+i][1] = fui((float)(pConstantData[4*i+1]));
context->ps_const_i[StartRegister+i][2] = fui((float)(pConstantData[4*i+2]));
context->ps_const_i[StartRegister+i][3] = fui((float)(pConstantData[4*i+3]));
}
}
context->changed.ps_const_i = TRUE;
context->changed.group |= NINE_STATE_PS_CONST;
}
void
nine_context_set_pixel_shader_constant_b(struct NineDevice9 *device,
UINT StartRegister,
const BOOL *pConstantData,
UINT BoolCount)
{
struct nine_context *context = &device->context;
int i;
uint32_t bool_true = device->driver_caps.ps_integer ? 0xFFFFFFFF : fui(1.0f);
for (i = 0; i < BoolCount; i++)
context->ps_const_b[StartRegister + i] = pConstantData[i] ? bool_true : 0;
context->changed.ps_const_b = TRUE;
context->changed.group |= NINE_STATE_PS_CONST;
}
void
nine_context_set_render_target(struct NineDevice9 *device,
DWORD RenderTargetIndex,
struct NineSurface9 *rt)
{
struct nine_context *context = &device->context;
const unsigned i = RenderTargetIndex;
if (i == 0) {
context->viewport.X = 0;
context->viewport.Y = 0;
context->viewport.Width = rt->desc.Width;
context->viewport.Height = rt->desc.Height;
context->viewport.MinZ = 0.0f;
context->viewport.MaxZ = 1.0f;
context->scissor.minx = 0;
context->scissor.miny = 0;
context->scissor.maxx = rt->desc.Width;
context->scissor.maxy = rt->desc.Height;
context->changed.group |= NINE_STATE_VIEWPORT | NINE_STATE_SCISSOR | NINE_STATE_MULTISAMPLE;
if (context->rt[0] &&
(context->rt[0]->desc.MultiSampleType <= D3DMULTISAMPLE_NONMASKABLE) !=
(rt->desc.MultiSampleType <= D3DMULTISAMPLE_NONMASKABLE))
context->changed.group |= NINE_STATE_SAMPLE_MASK;
}
if (context->rt[i] != rt) {
nine_bind(&context->rt[i], rt);
context->changed.group |= NINE_STATE_FB;
}
}
void
nine_context_set_depth_stencil(struct NineDevice9 *device,
struct NineSurface9 *ds)
{
struct nine_context *context = &device->context;
nine_bind(&context->ds, ds);
context->changed.group |= NINE_STATE_FB;
}
void
nine_context_set_viewport(struct NineDevice9 *device,
const D3DVIEWPORT9 *viewport)
{
struct nine_context *context = &device->context;
context->viewport = *viewport;
context->changed.group |= NINE_STATE_VIEWPORT;
}
void
nine_context_set_scissor(struct NineDevice9 *device,
const struct pipe_scissor_state *scissor)
{
struct nine_context *context = &device->context;
context->scissor = *scissor;
context->changed.group |= NINE_STATE_SCISSOR;
}
void
nine_context_set_transform(struct NineDevice9 *device,
D3DTRANSFORMSTATETYPE State,
const D3DMATRIX *pMatrix)
{
struct nine_context *context = &device->context;
D3DMATRIX *M = nine_state_access_transform(&context->ff, State, TRUE);
*M = *pMatrix;
context->ff.changed.transform[State / 32] |= 1 << (State % 32);
context->changed.group |= NINE_STATE_FF;
}
void
nine_context_set_material(struct NineDevice9 *device,
const D3DMATERIAL9 *pMaterial)
{
struct nine_context *context = &device->context;
context->ff.material = *pMaterial;
context->changed.group |= NINE_STATE_FF_MATERIAL;
}
void
nine_context_set_light(struct NineDevice9 *device,
DWORD Index,
const D3DLIGHT9 *pLight)
{
struct nine_context *context = &device->context;
(void)nine_state_set_light(&context->ff, Index, pLight);
context->changed.group |= NINE_STATE_FF_LIGHTING;
}
void
nine_context_light_enable(struct NineDevice9 *device,
DWORD Index,
BOOL Enable)
{
struct nine_context *context = &device->context;
nine_state_light_enable(&context->ff, &context->changed.group, Index, Enable);
}
void
nine_context_set_texture_stage_state(struct NineDevice9 *device,
DWORD Stage,
D3DTEXTURESTAGESTATETYPE Type,
DWORD Value)
{
struct nine_context *context = &device->context;
int bumpmap_index = -1;
context->ff.tex_stage[Stage][Type] = Value;
switch (Type) {
case D3DTSS_BUMPENVMAT00:
bumpmap_index = 4 * Stage;
break;
case D3DTSS_BUMPENVMAT01:
bumpmap_index = 4 * Stage + 1;
break;
case D3DTSS_BUMPENVMAT10:
bumpmap_index = 4 * Stage + 2;
break;
case D3DTSS_BUMPENVMAT11:
bumpmap_index = 4 * Stage + 3;
break;
case D3DTSS_BUMPENVLSCALE:
bumpmap_index = 4 * 8 + 2 * Stage;
break;
case D3DTSS_BUMPENVLOFFSET:
bumpmap_index = 4 * 8 + 2 * Stage + 1;
break;
case D3DTSS_TEXTURETRANSFORMFLAGS:
context->changed.group |= NINE_STATE_PS1X_SHADER;
break;
default:
break;
}
if (bumpmap_index >= 0) {
context->bumpmap_vars[bumpmap_index] = Value;
context->changed.group |= NINE_STATE_PS_CONST;
}
context->changed.group |= NINE_STATE_FF_PSSTAGES;
context->ff.changed.tex_stage[Stage][Type / 32] |= 1 << (Type % 32);
}
void
nine_context_set_clip_plane(struct NineDevice9 *device,
DWORD Index,
const float *pPlane)
{
struct nine_context *context = &device->context;
memcpy(&context->clip.ucp[Index][0], pPlane, sizeof(context->clip.ucp[0]));
context->changed.ucp = TRUE;
}
void
nine_context_apply_stateblock(struct NineDevice9 *device,
const struct nine_state *src)
{
struct nine_context *context = &device->context;
int i;
context->changed.group |= src->changed.group;
for (i = 0; i < ARRAY_SIZE(src->changed.rs); ++i) {
uint32_t m = src->changed.rs[i];
while (m) {
const int r = ffs(m) - 1;
m &= ~(1 << r);
context->rs[i * 32 + r] = nine_fix_render_state_value(i * 32 + r, src->rs_advertised[i * 32 + r]);
}
}
/* Textures */
if (src->changed.texture) {
uint32_t m = src->changed.texture;
unsigned s;
context->samplers_shadow &= ~m;
for (s = 0; m; ++s, m >>= 1) {
struct NineBaseTexture9 *tex = src->texture[s];
if (!(m & 1))
continue;
if (tex)
context->samplers_shadow |= tex->shadow << s;
nine_bind(&context->texture[s], src->texture[s]);
}
}
/* Sampler state */
if (src->changed.group & NINE_STATE_SAMPLER) {
unsigned s;
for (s = 0; s < NINE_MAX_SAMPLERS; ++s) {
uint32_t m = src->changed.sampler[s];
while (m) {
const int i = ffs(m) - 1;
m &= ~(1 << i);
if (nine_check_sampler_state_value(i, src->samp_advertised[s][i]))
context->samp[s][i] = src->samp_advertised[s][i];
}
context->changed.sampler[s] |= src->changed.sampler[s];
}
}
/* Vertex buffers */
if (src->changed.vtxbuf | src->changed.stream_freq) {
uint32_t m = src->changed.vtxbuf | src->changed.stream_freq;
for (i = 0; m; ++i, m >>= 1) {
if (src->changed.vtxbuf & (1 << i)) {
if (src->stream[i]) {
context->vtxbuf[i].buffer_offset = src->vtxbuf[i].buffer_offset;
pipe_resource_reference(&context->vtxbuf[i].buffer,
src->stream[i] ? NineVertexBuffer9_GetResource(src->stream[i]) : NULL);
context->vtxbuf[i].stride = src->vtxbuf[i].stride;
}
}
if (src->changed.stream_freq & (1 << i)) {
context->stream_freq[i] = src->stream_freq[i];
if (src->stream_freq[i] & D3DSTREAMSOURCE_INSTANCEDATA)
context->stream_instancedata_mask |= 1 << i;
else
context->stream_instancedata_mask &= ~(1 << i);
}
}
context->changed.vtxbuf |= src->changed.vtxbuf;
}
/* Index buffer */
if (src->changed.group & NINE_STATE_IDXBUF)
nine_context_set_indices(device, src->idxbuf);
/* Vertex declaration */
if ((src->changed.group & NINE_STATE_VDECL) && src->vdecl)
nine_context_set_vertex_declaration(device, src->vdecl);
/* Vertex shader */
if (src->changed.group & NINE_STATE_VS)
nine_bind(&context->vs, src->vs);
context->programmable_vs = context->vs && !(context->vdecl && context->vdecl->position_t);
/* Pixel shader */
if (src->changed.group & NINE_STATE_PS)
nine_bind(&context->ps, src->ps);
/* Vertex constants */
if (src->changed.group & NINE_STATE_VS_CONST) {
struct nine_range *r;
if (device->may_swvp) {
for (r = src->changed.vs_const_f; r; r = r->next) {
int bgn = r->bgn;
int end = r->end;
memcpy(&context->vs_const_f_swvp[bgn * 4],
&src->vs_const_f[bgn * 4],
(end - bgn) * 4 * sizeof(float));
if (bgn < device->max_vs_const_f) {
end = MIN2(end, device->max_vs_const_f);
memcpy(&context->vs_const_f[bgn * 4],
&src->vs_const_f[bgn * 4],
(end - bgn) * 4 * sizeof(float));
}
}
} else {
for (r = src->changed.vs_const_f; r; r = r->next) {
memcpy(&context->vs_const_f[r->bgn * 4],
&src->vs_const_f[r->bgn * 4],
(r->end - r->bgn) * 4 * sizeof(float));
}
}
for (r = src->changed.vs_const_i; r; r = r->next) {
memcpy(&context->vs_const_i[r->bgn * 4],
&src->vs_const_i[r->bgn * 4],
(r->end - r->bgn) * 4 * sizeof(int));
}
for (r = src->changed.vs_const_b; r; r = r->next) {
memcpy(&context->vs_const_b[r->bgn],
&src->vs_const_b[r->bgn],
(r->end - r->bgn) * sizeof(int));
}
context->changed.vs_const_f = !!src->changed.vs_const_f;
context->changed.vs_const_i = !!src->changed.vs_const_i;
context->changed.vs_const_b = !!src->changed.vs_const_b;
}
/* Pixel constants */
if (src->changed.group & NINE_STATE_PS_CONST) {
struct nine_range *r;
for (r = src->changed.ps_const_f; r; r = r->next) {
memcpy(&context->ps_const_f[r->bgn * 4],
&src->ps_const_f[r->bgn * 4],
(r->end - r->bgn) * 4 * sizeof(float));
}
if (src->changed.ps_const_i) {
uint16_t m = src->changed.ps_const_i;
for (i = ffs(m) - 1, m >>= i; m; ++i, m >>= 1)
if (m & 1)
memcpy(context->ps_const_i[i], src->ps_const_i[i], 4 * sizeof(int));
}
if (src->changed.ps_const_b) {
uint16_t m = src->changed.ps_const_b;
for (i = ffs(m) - 1, m >>= i; m; ++i, m >>= 1)
if (m & 1)
context->ps_const_b[i] = src->ps_const_b[i];
}
context->changed.ps_const_f = !!src->changed.ps_const_f;
context->changed.ps_const_i = !!src->changed.ps_const_i;
context->changed.ps_const_b = !!src->changed.ps_const_b;
}
/* Viewport */
if (src->changed.group & NINE_STATE_VIEWPORT)
context->viewport = src->viewport;
/* Scissor */
if (src->changed.group & NINE_STATE_SCISSOR)
context->scissor = src->scissor;
/* User Clip Planes */
if (src->changed.ucp) {
for (i = 0; i < PIPE_MAX_CLIP_PLANES; ++i)
if (src->changed.ucp & (1 << i))
memcpy(context->clip.ucp[i],
src->clip.ucp[i], sizeof(src->clip.ucp[0]));
context->changed.ucp = TRUE;
}
if (!(src->changed.group & NINE_STATE_FF))
return;
/* Fixed function state. */
if (src->changed.group & NINE_STATE_FF_MATERIAL)
context->ff.material = src->ff.material;
if (src->changed.group & NINE_STATE_FF_PSSTAGES) {
unsigned s;
for (s = 0; s < NINE_MAX_TEXTURE_STAGES; ++s) {
for (i = 0; i < NINED3DTSS_COUNT; ++i)
if (src->ff.changed.tex_stage[s][i / 32] & (1 << (i % 32)))
context->ff.tex_stage[s][i] = src->ff.tex_stage[s][i];
}
}
if (src->changed.group & NINE_STATE_FF_LIGHTING) {
unsigned num_lights = MAX2(context->ff.num_lights, src->ff.num_lights);
/* Can happen if the stateblock had recorded the creation of
* new lights. */
if (context->ff.num_lights < num_lights) {
context->ff.light = REALLOC(context->ff.light,
context->ff.num_lights * sizeof(D3DLIGHT9),
num_lights * sizeof(D3DLIGHT9));
memset(&context->ff.light[context->ff.num_lights], 0, (num_lights - context->ff.num_lights) * sizeof(D3DLIGHT9));
for (i = context->ff.num_lights; i < num_lights; ++i)
context->ff.light[i].Type = (D3DLIGHTTYPE)NINED3DLIGHT_INVALID;
context->ff.num_lights = num_lights;
}
/* src->ff.num_lights < num_lights has been handled before */
assert (src->ff.num_lights == num_lights);
for (i = 0; i < num_lights; ++i)
if (src->ff.light[i].Type != NINED3DLIGHT_INVALID)
context->ff.light[i] = src->ff.light[i];
memcpy(context->ff.active_light, src->ff.active_light, sizeof(src->ff.active_light) );
context->ff.num_lights_active = src->ff.num_lights_active;
}
if (src->changed.group & NINE_STATE_FF_VSTRANSF) {
for (i = 0; i < ARRAY_SIZE(src->ff.changed.transform); ++i) {
unsigned s;
if (!src->ff.changed.transform[i])
continue;
for (s = i * 32; s < (i * 32 + 32); ++s) {
if (!(src->ff.changed.transform[i] & (1 << (s % 32))))
continue;
*nine_state_access_transform(&context->ff, s, TRUE) =
*nine_state_access_transform( /* const because !alloc */
(struct nine_ff_state *)&src->ff, s, FALSE);
}
context->ff.changed.transform[i] |= src->ff.changed.transform[i];
}
}
}
static void
nine_update_state_framebuffer_clear(struct NineDevice9 *device)
{
struct nine_context *context = &device->context;
validate_textures(device);
if (context->changed.group & NINE_STATE_FB)
update_framebuffer(device, TRUE);
}
/* Checks were already done before the call */
void
nine_context_clear_fb(struct NineDevice9 *device,
DWORD Count,
const D3DRECT *pRects,
DWORD Flags,
D3DCOLOR Color,
float Z,
DWORD Stencil)
{
struct nine_context *context = &device->context;
const int sRGB = context->rs[D3DRS_SRGBWRITEENABLE] ? 1 : 0;
struct pipe_surface *cbuf, *zsbuf;
struct pipe_context *pipe = device->pipe;
struct NineSurface9 *zsbuf_surf = context->ds;
struct NineSurface9 *rt;
unsigned bufs = 0;
unsigned r, i;
union pipe_color_union rgba;
unsigned rt_mask = 0;
D3DRECT rect;
nine_update_state_framebuffer_clear(device);
if (Flags & D3DCLEAR_TARGET) bufs |= PIPE_CLEAR_COLOR;
/* Ignore Z buffer if not bound */
if (context->pipe_data.fb.zsbuf != NULL) {
if (Flags & D3DCLEAR_ZBUFFER) bufs |= PIPE_CLEAR_DEPTH;
if (Flags & D3DCLEAR_STENCIL) bufs |= PIPE_CLEAR_STENCIL;
}
if (!bufs)
return;
d3dcolor_to_pipe_color_union(&rgba, Color);
rect.x1 = context->viewport.X;
rect.y1 = context->viewport.Y;
rect.x2 = context->viewport.Width + rect.x1;
rect.y2 = context->viewport.Height + rect.y1;
/* Both rectangles apply, which is weird, but that's D3D9. */
if (context->rs[D3DRS_SCISSORTESTENABLE]) {
rect.x1 = MAX2(rect.x1, context->scissor.minx);
rect.y1 = MAX2(rect.y1, context->scissor.miny);
rect.x2 = MIN2(rect.x2, context->scissor.maxx);
rect.y2 = MIN2(rect.y2, context->scissor.maxy);
}
if (Count) {
/* Maybe apps like to specify a large rect ? */
if (pRects[0].x1 <= rect.x1 && pRects[0].x2 >= rect.x2 &&
pRects[0].y1 <= rect.y1 && pRects[0].y2 >= rect.y2) {
DBG("First rect covers viewport.\n");
Count = 0;
pRects = NULL;
}
}
if (rect.x1 >= context->pipe_data.fb.width || rect.y1 >= context->pipe_data.fb.height)
return;
for (i = 0; i < device->caps.NumSimultaneousRTs; ++i) {
if (context->rt[i] && context->rt[i]->desc.Format != D3DFMT_NULL)
rt_mask |= 1 << i;
}
/* fast path, clears everything at once */
if (!Count &&
(!(bufs & PIPE_CLEAR_COLOR) || (rt_mask == context->rt_mask)) &&
rect.x1 == 0 && rect.y1 == 0 &&
/* Case we clear only render target. Check clear region vs rt. */
((!(bufs & (PIPE_CLEAR_DEPTH | PIPE_CLEAR_STENCIL)) &&
rect.x2 >= context->pipe_data.fb.width &&
rect.y2 >= context->pipe_data.fb.height) ||
/* Case we clear depth buffer (and eventually rt too).
* depth buffer size is always >= rt size. Compare to clear region */
((bufs & (PIPE_CLEAR_DEPTH | PIPE_CLEAR_STENCIL)) &&
rect.x2 >= zsbuf_surf->desc.Width &&
rect.y2 >= zsbuf_surf->desc.Height))) {
DBG("Clear fast path\n");
pipe->clear(pipe, bufs, &rgba, Z, Stencil);
return;
}
if (!Count) {
Count = 1;
pRects = &rect;
}
for (i = 0; i < device->caps.NumSimultaneousRTs; ++i) {
rt = context->rt[i];
if (!rt || rt->desc.Format == D3DFMT_NULL ||
!(bufs & PIPE_CLEAR_COLOR))
continue; /* save space, compiler should hoist this */
cbuf = NineSurface9_GetSurface(rt, sRGB);
for (r = 0; r < Count; ++r) {
/* Don't trust users to pass these in the right order. */
unsigned x1 = MIN2(pRects[r].x1, pRects[r].x2);
unsigned y1 = MIN2(pRects[r].y1, pRects[r].y2);
unsigned x2 = MAX2(pRects[r].x1, pRects[r].x2);
unsigned y2 = MAX2(pRects[r].y1, pRects[r].y2);
#ifndef NINE_LAX
/* Drop negative rectangles (like wine expects). */
if (pRects[r].x1 > pRects[r].x2) continue;
if (pRects[r].y1 > pRects[r].y2) continue;
#endif
x1 = MAX2(x1, rect.x1);
y1 = MAX2(y1, rect.y1);
x2 = MIN3(x2, rect.x2, rt->desc.Width);
y2 = MIN3(y2, rect.y2, rt->desc.Height);
DBG("Clearing (%u..%u)x(%u..%u)\n", x1, x2, y1, y2);
pipe->clear_render_target(pipe, cbuf, &rgba,
x1, y1, x2 - x1, y2 - y1, false);
}
}
if (!(bufs & PIPE_CLEAR_DEPTHSTENCIL))
return;
bufs &= PIPE_CLEAR_DEPTHSTENCIL;
for (r = 0; r < Count; ++r) {
unsigned x1 = MIN2(pRects[r].x1, pRects[r].x2);
unsigned y1 = MIN2(pRects[r].y1, pRects[r].y2);
unsigned x2 = MAX2(pRects[r].x1, pRects[r].x2);
unsigned y2 = MAX2(pRects[r].y1, pRects[r].y2);
#ifndef NINE_LAX
/* Drop negative rectangles. */
if (pRects[r].x1 > pRects[r].x2) continue;
if (pRects[r].y1 > pRects[r].y2) continue;
#endif
x1 = MIN2(x1, rect.x1);
y1 = MIN2(y1, rect.y1);
x2 = MIN3(x2, rect.x2, zsbuf_surf->desc.Width);
y2 = MIN3(y2, rect.y2, zsbuf_surf->desc.Height);
zsbuf = NineSurface9_GetSurface(zsbuf_surf, 0);
assert(zsbuf);
pipe->clear_depth_stencil(pipe, zsbuf, bufs, Z, Stencil,
x1, y1, x2 - x1, y2 - y1, false);
}
return;
}
static inline void
init_draw_info(struct pipe_draw_info *info,
struct NineDevice9 *dev, D3DPRIMITIVETYPE type, UINT count)
{
info->mode = d3dprimitivetype_to_pipe_prim(type);
info->count = prim_count_to_vertex_count(type, count);
info->start_instance = 0;
info->instance_count = 1;
if (dev->context.stream_instancedata_mask & dev->context.stream_usage_mask)
info->instance_count = MAX2(dev->context.stream_freq[0] & 0x7FFFFF, 1);
info->primitive_restart = FALSE;
info->restart_index = 0;
info->count_from_stream_output = NULL;
info->indirect = NULL;
info->indirect_params = NULL;
}
void
nine_context_draw_primitive(struct NineDevice9 *device,
D3DPRIMITIVETYPE PrimitiveType,
UINT StartVertex,
UINT PrimitiveCount)
{
struct pipe_draw_info info;
nine_update_state(device);
init_draw_info(&info, device, PrimitiveType, PrimitiveCount);
info.indexed = FALSE;
info.start = StartVertex;
info.index_bias = 0;
info.min_index = info.start;
info.max_index = info.count - 1;
device->pipe->draw_vbo(device->pipe, &info);
}
void
nine_context_draw_indexed_primitive(struct NineDevice9 *device,
D3DPRIMITIVETYPE PrimitiveType,
INT BaseVertexIndex,
UINT MinVertexIndex,
UINT NumVertices,
UINT StartIndex,
UINT PrimitiveCount)
{
struct pipe_draw_info info;
nine_update_state(device);
init_draw_info(&info, device, PrimitiveType, PrimitiveCount);
info.indexed = TRUE;
info.start = StartIndex;
info.index_bias = BaseVertexIndex;
/* These don't include index bias: */
info.min_index = MinVertexIndex;
info.max_index = MinVertexIndex + NumVertices - 1;
device->pipe->draw_vbo(device->pipe, &info);
}
void
nine_context_draw_primitive_from_vtxbuf(struct NineDevice9 *device,
D3DPRIMITIVETYPE PrimitiveType,
UINT PrimitiveCount,
struct pipe_vertex_buffer *vtxbuf)
{
struct pipe_draw_info info;
nine_update_state(device);
init_draw_info(&info, device, PrimitiveType, PrimitiveCount);
info.indexed = FALSE;
info.start = 0;
info.index_bias = 0;
info.min_index = 0;
info.max_index = info.count - 1;
device->pipe->set_vertex_buffers(device->pipe, 0, 1, vtxbuf);
device->pipe->draw_vbo(device->pipe, &info);
}
void
nine_context_draw_indexed_primitive_from_vtxbuf_idxbuf(struct NineDevice9 *device,
D3DPRIMITIVETYPE PrimitiveType,
UINT MinVertexIndex,
UINT NumVertices,
UINT PrimitiveCount,
struct pipe_vertex_buffer *vbuf,
struct pipe_index_buffer *ibuf)
{
struct pipe_draw_info info;
nine_update_state(device);
init_draw_info(&info, device, PrimitiveType, PrimitiveCount);
info.indexed = TRUE;
info.start = 0;
info.index_bias = 0;
info.min_index = MinVertexIndex;
info.max_index = MinVertexIndex + NumVertices - 1;
device->pipe->set_vertex_buffers(device->pipe, 0, 1, vbuf);
device->pipe->set_index_buffer(device->pipe, ibuf);
device->pipe->draw_vbo(device->pipe, &info);
}
struct pipe_query *
nine_context_create_query(struct NineDevice9 *device, unsigned query_type)
{
return device->pipe->create_query(device->pipe, query_type, 0);
}
void
nine_context_destroy_query(struct NineDevice9 *device, struct pipe_query *query)
{
device->pipe->destroy_query(device->pipe, query);
}
void
nine_context_begin_query(struct NineDevice9 *device, struct pipe_query *query)
{
(void) device->pipe->begin_query(device->pipe, query);
}
void
nine_context_end_query(struct NineDevice9 *device, struct pipe_query *query)
{
(void) device->pipe->end_query(device->pipe, query);
}
boolean
nine_context_get_query_result(struct NineDevice9 *device, struct pipe_query *query,
boolean flush, boolean wait,
union pipe_query_result *result)
{
(void) flush;
return device->pipe->get_query_result(device->pipe, query, wait, result);
}
/* State defaults */
static const DWORD nine_render_state_defaults[NINED3DRS_LAST + 1] =
{
/* [D3DRS_ZENABLE] = D3DZB_TRUE; wine: auto_depth_stencil */
[D3DRS_ZENABLE] = D3DZB_FALSE,
[D3DRS_FILLMODE] = D3DFILL_SOLID,
[D3DRS_SHADEMODE] = D3DSHADE_GOURAUD,
/* [D3DRS_LINEPATTERN] = 0x00000000, */
[D3DRS_ZWRITEENABLE] = TRUE,
[D3DRS_ALPHATESTENABLE] = FALSE,
[D3DRS_LASTPIXEL] = TRUE,
[D3DRS_SRCBLEND] = D3DBLEND_ONE,
[D3DRS_DESTBLEND] = D3DBLEND_ZERO,
[D3DRS_CULLMODE] = D3DCULL_CCW,
[D3DRS_ZFUNC] = D3DCMP_LESSEQUAL,
[D3DRS_ALPHAFUNC] = D3DCMP_ALWAYS,
[D3DRS_ALPHAREF] = 0,
[D3DRS_DITHERENABLE] = FALSE,
[D3DRS_ALPHABLENDENABLE] = FALSE,
[D3DRS_FOGENABLE] = FALSE,
[D3DRS_SPECULARENABLE] = FALSE,
/* [D3DRS_ZVISIBLE] = 0, */
[D3DRS_FOGCOLOR] = 0,
[D3DRS_FOGTABLEMODE] = D3DFOG_NONE,
[D3DRS_FOGSTART] = 0x00000000,
[D3DRS_FOGEND] = 0x3F800000,
[D3DRS_FOGDENSITY] = 0x3F800000,
/* [D3DRS_EDGEANTIALIAS] = FALSE, */
[D3DRS_RANGEFOGENABLE] = FALSE,
[D3DRS_STENCILENABLE] = FALSE,
[D3DRS_STENCILFAIL] = D3DSTENCILOP_KEEP,
[D3DRS_STENCILZFAIL] = D3DSTENCILOP_KEEP,
[D3DRS_STENCILPASS] = D3DSTENCILOP_KEEP,
[D3DRS_STENCILREF] = 0,
[D3DRS_STENCILMASK] = 0xFFFFFFFF,
[D3DRS_STENCILFUNC] = D3DCMP_ALWAYS,
[D3DRS_STENCILWRITEMASK] = 0xFFFFFFFF,
[D3DRS_TEXTUREFACTOR] = 0xFFFFFFFF,
[D3DRS_WRAP0] = 0,
[D3DRS_WRAP1] = 0,
[D3DRS_WRAP2] = 0,
[D3DRS_WRAP3] = 0,
[D3DRS_WRAP4] = 0,
[D3DRS_WRAP5] = 0,
[D3DRS_WRAP6] = 0,
[D3DRS_WRAP7] = 0,
[D3DRS_CLIPPING] = TRUE,
[D3DRS_LIGHTING] = TRUE,
[D3DRS_AMBIENT] = 0,
[D3DRS_FOGVERTEXMODE] = D3DFOG_NONE,
[D3DRS_COLORVERTEX] = TRUE,
[D3DRS_LOCALVIEWER] = TRUE,
[D3DRS_NORMALIZENORMALS] = FALSE,
[D3DRS_DIFFUSEMATERIALSOURCE] = D3DMCS_COLOR1,
[D3DRS_SPECULARMATERIALSOURCE] = D3DMCS_COLOR2,
[D3DRS_AMBIENTMATERIALSOURCE] = D3DMCS_MATERIAL,
[D3DRS_EMISSIVEMATERIALSOURCE] = D3DMCS_MATERIAL,
[D3DRS_VERTEXBLEND] = D3DVBF_DISABLE,
[D3DRS_CLIPPLANEENABLE] = 0,
/* [D3DRS_SOFTWAREVERTEXPROCESSING] = FALSE, */
[D3DRS_POINTSIZE] = 0x3F800000,
[D3DRS_POINTSIZE_MIN] = 0x3F800000,
[D3DRS_POINTSPRITEENABLE] = FALSE,
[D3DRS_POINTSCALEENABLE] = FALSE,
[D3DRS_POINTSCALE_A] = 0x3F800000,
[D3DRS_POINTSCALE_B] = 0x00000000,
[D3DRS_POINTSCALE_C] = 0x00000000,
[D3DRS_MULTISAMPLEANTIALIAS] = TRUE,
[D3DRS_MULTISAMPLEMASK] = 0xFFFFFFFF,
[D3DRS_PATCHEDGESTYLE] = D3DPATCHEDGE_DISCRETE,
/* [D3DRS_PATCHSEGMENTS] = 0x3F800000, */
[D3DRS_DEBUGMONITORTOKEN] = 0xDEADCAFE,
[D3DRS_POINTSIZE_MAX] = 0x3F800000, /* depends on cap */
[D3DRS_INDEXEDVERTEXBLENDENABLE] = FALSE,
[D3DRS_COLORWRITEENABLE] = 0x0000000f,
[D3DRS_TWEENFACTOR] = 0x00000000,
[D3DRS_BLENDOP] = D3DBLENDOP_ADD,
[D3DRS_POSITIONDEGREE] = D3DDEGREE_CUBIC,
[D3DRS_NORMALDEGREE] = D3DDEGREE_LINEAR,
[D3DRS_SCISSORTESTENABLE] = FALSE,
[D3DRS_SLOPESCALEDEPTHBIAS] = 0,
[D3DRS_MINTESSELLATIONLEVEL] = 0x3F800000,
[D3DRS_MAXTESSELLATIONLEVEL] = 0x3F800000,
[D3DRS_ANTIALIASEDLINEENABLE] = FALSE,
[D3DRS_ADAPTIVETESS_X] = 0x00000000,
[D3DRS_ADAPTIVETESS_Y] = 0x00000000,
[D3DRS_ADAPTIVETESS_Z] = 0x3F800000,
[D3DRS_ADAPTIVETESS_W] = 0x00000000,
[D3DRS_ENABLEADAPTIVETESSELLATION] = FALSE,
[D3DRS_TWOSIDEDSTENCILMODE] = FALSE,
[D3DRS_CCW_STENCILFAIL] = D3DSTENCILOP_KEEP,
[D3DRS_CCW_STENCILZFAIL] = D3DSTENCILOP_KEEP,
[D3DRS_CCW_STENCILPASS] = D3DSTENCILOP_KEEP,
[D3DRS_CCW_STENCILFUNC] = D3DCMP_ALWAYS,
[D3DRS_COLORWRITEENABLE1] = 0x0000000F,
[D3DRS_COLORWRITEENABLE2] = 0x0000000F,
[D3DRS_COLORWRITEENABLE3] = 0x0000000F,
[D3DRS_BLENDFACTOR] = 0xFFFFFFFF,
[D3DRS_SRGBWRITEENABLE] = 0,
[D3DRS_DEPTHBIAS] = 0,
[D3DRS_WRAP8] = 0,
[D3DRS_WRAP9] = 0,
[D3DRS_WRAP10] = 0,
[D3DRS_WRAP11] = 0,
[D3DRS_WRAP12] = 0,
[D3DRS_WRAP13] = 0,
[D3DRS_WRAP14] = 0,
[D3DRS_WRAP15] = 0,
[D3DRS_SEPARATEALPHABLENDENABLE] = FALSE,
[D3DRS_SRCBLENDALPHA] = D3DBLEND_ONE,
[D3DRS_DESTBLENDALPHA] = D3DBLEND_ZERO,
[D3DRS_BLENDOPALPHA] = D3DBLENDOP_ADD,
[NINED3DRS_VSPOINTSIZE] = FALSE,
[NINED3DRS_RTMASK] = 0xf,
[NINED3DRS_ALPHACOVERAGE] = FALSE,
[NINED3DRS_MULTISAMPLE] = FALSE
};
static const DWORD nine_tex_stage_state_defaults[NINED3DTSS_LAST + 1] =
{
[D3DTSS_COLOROP] = D3DTOP_DISABLE,
[D3DTSS_ALPHAOP] = D3DTOP_DISABLE,
[D3DTSS_COLORARG1] = D3DTA_TEXTURE,
[D3DTSS_COLORARG2] = D3DTA_CURRENT,
[D3DTSS_COLORARG0] = D3DTA_CURRENT,
[D3DTSS_ALPHAARG1] = D3DTA_TEXTURE,
[D3DTSS_ALPHAARG2] = D3DTA_CURRENT,
[D3DTSS_ALPHAARG0] = D3DTA_CURRENT,
[D3DTSS_RESULTARG] = D3DTA_CURRENT,
[D3DTSS_BUMPENVMAT00] = 0,
[D3DTSS_BUMPENVMAT01] = 0,
[D3DTSS_BUMPENVMAT10] = 0,
[D3DTSS_BUMPENVMAT11] = 0,
[D3DTSS_BUMPENVLSCALE] = 0,
[D3DTSS_BUMPENVLOFFSET] = 0,
[D3DTSS_TEXCOORDINDEX] = 0,
[D3DTSS_TEXTURETRANSFORMFLAGS] = D3DTTFF_DISABLE,
};
static const DWORD nine_samp_state_defaults[NINED3DSAMP_LAST + 1] =
{
[D3DSAMP_ADDRESSU] = D3DTADDRESS_WRAP,
[D3DSAMP_ADDRESSV] = D3DTADDRESS_WRAP,
[D3DSAMP_ADDRESSW] = D3DTADDRESS_WRAP,
[D3DSAMP_BORDERCOLOR] = 0,
[D3DSAMP_MAGFILTER] = D3DTEXF_POINT,
[D3DSAMP_MINFILTER] = D3DTEXF_POINT,
[D3DSAMP_MIPFILTER] = D3DTEXF_NONE,
[D3DSAMP_MIPMAPLODBIAS] = 0,
[D3DSAMP_MAXMIPLEVEL] = 0,
[D3DSAMP_MAXANISOTROPY] = 1,
[D3DSAMP_SRGBTEXTURE] = 0,
[D3DSAMP_ELEMENTINDEX] = 0,
[D3DSAMP_DMAPOFFSET] = 0,
[NINED3DSAMP_MINLOD] = 0,
[NINED3DSAMP_SHADOW] = 0,
[NINED3DSAMP_CUBETEX] = 0
};
void nine_state_restore_non_cso(struct NineDevice9 *device)
{
struct nine_context *context = &device->context;
context->changed.group = NINE_STATE_ALL;
context->changed.vtxbuf = (1ULL << device->caps.MaxStreams) - 1;
context->changed.ucp = TRUE;
context->commit |= NINE_STATE_COMMIT_CONST_VS | NINE_STATE_COMMIT_CONST_PS;
}
void
nine_state_set_defaults(struct NineDevice9 *device, const D3DCAPS9 *caps,
boolean is_reset)
{
struct nine_state *state = &device->state;
struct nine_context *context = &device->context;
unsigned s;
/* Initialize defaults.
*/
memcpy(context->rs, nine_render_state_defaults, sizeof(context->rs));
for (s = 0; s < ARRAY_SIZE(state->ff.tex_stage); ++s) {
memcpy(&state->ff.tex_stage[s], nine_tex_stage_state_defaults,
sizeof(state->ff.tex_stage[s]));
state->ff.tex_stage[s][D3DTSS_TEXCOORDINDEX] = s;
}
state->ff.tex_stage[0][D3DTSS_COLOROP] = D3DTOP_MODULATE;
state->ff.tex_stage[0][D3DTSS_ALPHAOP] = D3DTOP_SELECTARG1;
for (s = 0; s < ARRAY_SIZE(state->ff.tex_stage); ++s)
memcpy(&context->ff.tex_stage[s], state->ff.tex_stage[s],
sizeof(state->ff.tex_stage[s]));
memset(&context->bumpmap_vars, 0, sizeof(context->bumpmap_vars));
for (s = 0; s < NINE_MAX_SAMPLERS; ++s) {
memcpy(&context->samp[s], nine_samp_state_defaults,
sizeof(context->samp[s]));
memcpy(&state->samp_advertised[s], nine_samp_state_defaults,
sizeof(state->samp_advertised[s]));
}
memset(state->vs_const_f, 0, VS_CONST_F_SIZE(device));
memset(context->vs_const_f, 0, device->vs_const_size);
if (context->vs_const_f_swvp)
memset(context->vs_const_f_swvp, 0, NINE_MAX_CONST_F_SWVP * sizeof(float[4]));
memset(state->vs_const_i, 0, VS_CONST_I_SIZE(device));
memset(context->vs_const_i, 0, VS_CONST_I_SIZE(device));
memset(state->vs_const_b, 0, VS_CONST_B_SIZE(device));
memset(context->vs_const_b, 0, VS_CONST_B_SIZE(device));
memset(state->ps_const_f, 0, device->ps_const_size);
memset(context->ps_const_f, 0, device->ps_const_size);
memset(state->ps_const_i, 0, sizeof(state->ps_const_i));
memset(context->ps_const_i, 0, sizeof(context->ps_const_i));
memset(state->ps_const_b, 0, sizeof(state->ps_const_b));
memset(context->ps_const_b, 0, sizeof(context->ps_const_b));
/* Cap dependent initial state:
*/
context->rs[D3DRS_POINTSIZE_MAX] = fui(caps->MaxPointSize);
memcpy(state->rs_advertised, context->rs, sizeof(context->rs));
/* Set changed flags to initialize driver.
*/
context->changed.group = NINE_STATE_ALL;
context->changed.vtxbuf = (1ULL << device->caps.MaxStreams) - 1;
context->changed.ucp = TRUE;
context->ff.changed.transform[0] = ~0;
context->ff.changed.transform[D3DTS_WORLD / 32] |= 1 << (D3DTS_WORLD % 32);
if (!is_reset) {
state->viewport.MinZ = context->viewport.MinZ = 0.0f;
state->viewport.MaxZ = context->viewport.MaxZ = 1.0f;
}
for (s = 0; s < NINE_MAX_SAMPLERS; ++s)
context->changed.sampler[s] = ~0;
if (!is_reset) {
context->dummy_vbo_bound_at = -1;
context->vbo_bound_done = FALSE;
}
}
void
nine_state_clear(struct nine_state *state, const boolean device)
{
unsigned i;
for (i = 0; i < ARRAY_SIZE(state->rt); ++i)
nine_bind(&state->rt[i], NULL);
nine_bind(&state->ds, NULL);
nine_bind(&state->vs, NULL);
nine_bind(&state->ps, NULL);
nine_bind(&state->vdecl, NULL);
for (i = 0; i < PIPE_MAX_ATTRIBS; ++i)
nine_bind(&state->stream[i], NULL);
nine_bind(&state->idxbuf, NULL);
for (i = 0; i < NINE_MAX_SAMPLERS; ++i) {
if (device &&
state->texture[i]