src/mesa/drivers/dri/i965/brw_meta_util.c - platform/external/mesa3d - Git at Google

 /*
  * Copyright © 2014 Intel Corporation
  *
  * Permission is hereby granted, free of charge, to any person obtaining a
  * copy of this software and associated documentation files (the "Software"),
  * to deal in the Software without restriction, including without limitation
  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  * and/or sell copies of the Software, and to permit persons to whom the
  * Software is furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice (including the next
  * paragraph) shall be included in all copies or substantial portions of the
  * Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
  * IN THE SOFTWARE.
  */

 #include "brw_context.h"
 #include "brw_defines.h"
 #include "intel_fbo.h"
 #include "brw_meta_util.h"
 #include "brw_state.h"
 #include "main/blend.h"
 #include "main/fbobject.h"
 #include "util/format_srgb.h"

 /**
  * Helper function for handling mirror image blits.
  *
  * If coord0 > coord1, swap them and invert the "mirror" boolean.
  */
 static inline void
 fixup_mirroring(bool *mirror, float *coord0, float *coord1)
 {
    if (*coord0 > *coord1) {
       *mirror = !*mirror;
       float tmp = *coord0;
       *coord0 = *coord1;
       *coord1 = tmp;
    }
 }

 /**
  * Compute the number of pixels to clip for each side of a rect
  *
  * \param x0 The rect's left coordinate
  * \param y0 The rect's bottom coordinate
  * \param x1 The rect's right coordinate
  * \param y1 The rect's top coordinate
  * \param min_x The clipping region's left coordinate
  * \param min_y The clipping region's bottom coordinate
  * \param max_x The clipping region's right coordinate
  * \param max_y The clipping region's top coordinate
  * \param clipped_x0 The number of pixels to clip from the left side
  * \param clipped_y0 The number of pixels to clip from the bottom side
  * \param clipped_x1 The number of pixels to clip from the right side
  * \param clipped_y1 The number of pixels to clip from the top side
  *
  * \return false if we clip everything away, true otherwise
  */
 static inline bool
 compute_pixels_clipped(float x0, float y0, float x1, float y1,
                        float min_x, float min_y, float max_x, float max_y,
                        float *clipped_x0, float *clipped_y0, float *clipped_x1, float *clipped_y1)
 {
    /* If we are going to clip everything away, stop. */
    if (!(min_x <= max_x &&
          min_y <= max_y &&
          x0 <= max_x &&
          y0 <= max_y &&
          min_x <= x1 &&
          min_y <= y1 &&
          x0 <= x1 &&
          y0 <= y1)) {
       return false;
    }

    if (x0 < min_x)
       *clipped_x0 = min_x - x0;
    else
       *clipped_x0 = 0;
    if (max_x < x1)
       *clipped_x1 = x1 - max_x;
    else
       *clipped_x1 = 0;

    if (y0 < min_y)
       *clipped_y0 = min_y - y0;
    else
       *clipped_y0 = 0;
    if (max_y < y1)
       *clipped_y1 = y1 - max_y;
    else
       *clipped_y1 = 0;

    return true;
 }

 /**
  * Clips a coordinate (left, right, top or bottom) for the src or dst rect
  * (whichever requires the largest clip) and adjusts the coordinate
  * for the other rect accordingly.
  *
  * \param mirror true if mirroring is required
  * \param src the source rect coordinate (for example srcX0)
  * \param dst0 the dst rect coordinate (for example dstX0)
  * \param dst1 the opposite dst rect coordinate (for example dstX1)
  * \param clipped_src0 number of pixels to clip from the src coordinate
  * \param clipped_dst0 number of pixels to clip from the dst coordinate
  * \param clipped_dst1 number of pixels to clip from the opposite dst coordinate
  * \param scale the src vs dst scale involved for that coordinate
  * \param isLeftOrBottom true if we are clipping the left or bottom sides
  *        of the rect.
  */
 static inline void
 clip_coordinates(bool mirror,
                  float *src, float *dst0, float *dst1,
                  float clipped_src0,
                  float clipped_dst0,
                  float clipped_dst1,
                  float scale,
                  bool isLeftOrBottom)
 {
    /* When clipping we need to add or subtract pixels from the original
     * coordinates depending on whether we are acting on the left/bottom
     * or right/top sides of the rect respectively. We assume we have to
     * add them in the code below, and multiply by -1 when we should
     * subtract.
     */
    int mult = isLeftOrBottom ? 1 : -1;

    if (!mirror) {
       if (clipped_src0 >= clipped_dst0 * scale) {
          *src += clipped_src0 * mult;
          *dst0 += clipped_src0 / scale * mult;
       } else {
          *dst0 += clipped_dst0 * mult;
          *src += clipped_dst0 * scale * mult;
       }
    } else {
       if (clipped_src0 >= clipped_dst1 * scale) {
          *src += clipped_src0 * mult;
          *dst1 -= clipped_src0 / scale * mult;
       } else {
          *dst1 -= clipped_dst1 * mult;
          *src += clipped_dst1 * scale * mult;
       }
    }
 }

 bool
 brw_meta_mirror_clip_and_scissor(const struct gl_context *ctx,
                                  const struct gl_framebuffer *read_fb,
                                  const struct gl_framebuffer *draw_fb,
                                  GLfloat *srcX0, GLfloat *srcY0,
                                  GLfloat *srcX1, GLfloat *srcY1,
                                  GLfloat *dstX0, GLfloat *dstY0,
                                  GLfloat *dstX1, GLfloat *dstY1,
                                  bool *mirror_x, bool *mirror_y)
 {
    *mirror_x = false;
    *mirror_y = false;

    /* Detect if the blit needs to be mirrored */
    fixup_mirroring(mirror_x, srcX0, srcX1);
    fixup_mirroring(mirror_x, dstX0, dstX1);
    fixup_mirroring(mirror_y, srcY0, srcY1);
    fixup_mirroring(mirror_y, dstY0, dstY1);

    /* Compute number of pixels to clip for each side of both rects. Return
     * early if we are going to clip everything away.
     */
    float clip_src_x0;
    float clip_src_x1;
    float clip_src_y0;
    float clip_src_y1;
    float clip_dst_x0;
    float clip_dst_x1;
    float clip_dst_y0;
    float clip_dst_y1;

    if (!compute_pixels_clipped(*srcX0, *srcY0, *srcX1, *srcY1,
                                0, 0, read_fb->Width, read_fb->Height,
                                &clip_src_x0, &clip_src_y0, &clip_src_x1, &clip_src_y1))
       return true;

    if (!compute_pixels_clipped(*dstX0, *dstY0, *dstX1, *dstY1,
                                draw_fb->_Xmin, draw_fb->_Ymin, draw_fb->_Xmax, draw_fb->_Ymax,
                                &clip_dst_x0, &clip_dst_y0, &clip_dst_x1, &clip_dst_y1))
       return true;

    /* When clipping any of the two rects we need to adjust the coordinates in
     * the other rect considering the scaling factor involved. To obtain the best
     * precision we want to make sure that we only clip once per side to avoid
     * accumulating errors due to the scaling adjustment.
     *
     * For example, if srcX0 and dstX0 need both to be clipped we want to avoid
     * the situation where we clip srcX0 first, then adjust dstX0 accordingly
     * but then we realize that the resulting dstX0 still needs to be clipped,
     * so we clip dstX0 and adjust srcX0 again. Because we are applying scaling
     * factors to adjust the coordinates in each clipping pass we lose some
     * precision and that can affect the results of the blorp blit operation
     * slightly. What we want to do here is detect the rect that we should
     * clip first for each side so that when we adjust the other rect we ensure
     * the resulting coordinate does not need to be clipped again.
     *
     * The code below implements this by comparing the number of pixels that
     * we need to clip for each side of both rects  considering the scales
     * involved. For example, clip_src_x0 represents the number of pixels to be
     * clipped for the src rect's left side, so if clip_src_x0 = 5,
     * clip_dst_x0 = 4 and scaleX = 2 it means that we are clipping more from
     * the dst rect so we should clip dstX0 only and adjust srcX0. This is
     * because clipping 4 pixels in the dst is equivalent to clipping
     * 4 * 2 = 8 > 5 in the src.
     */

    float scaleX = (float) (*srcX1 - *srcX0) / (*dstX1 - *dstX0);
    float scaleY = (float) (*srcY1 - *srcY0) / (*dstY1 - *dstY0);

    /* Clip left side */
    clip_coordinates(*mirror_x,
                     srcX0, dstX0, dstX1,
                     clip_src_x0, clip_dst_x0, clip_dst_x1,
                     scaleX, true);

    /* Clip right side */
    clip_coordinates(*mirror_x,
                     srcX1, dstX1, dstX0,
                     clip_src_x1, clip_dst_x1, clip_dst_x0,
                     scaleX, false);

    /* Clip bottom side */
    clip_coordinates(*mirror_y,
                     srcY0, dstY0, dstY1,
                     clip_src_y0, clip_dst_y0, clip_dst_y1,
                     scaleY, true);

    /* Clip top side */
    clip_coordinates(*mirror_y,
                     srcY1, dstY1, dstY0,
                     clip_src_y1, clip_dst_y1, clip_dst_y0,
                     scaleY, false);

    /* Account for the fact that in the system framebuffer, the origin is at
     * the lower left.
     */
    if (_mesa_is_winsys_fbo(read_fb)) {
       GLint tmp = read_fb->Height - *srcY0;
       *srcY0 = read_fb->Height - *srcY1;
       *srcY1 = tmp;
       *mirror_y = !*mirror_y;
    }
    if (_mesa_is_winsys_fbo(draw_fb)) {
       GLint tmp = draw_fb->Height - *dstY0;
       *dstY0 = draw_fb->Height - *dstY1;
       *dstY1 = tmp;
       *mirror_y = !*mirror_y;
    }

    return false;
 }

 /**
  * Creates a new named renderbuffer that wraps the first slice
  * of an existing miptree.
  *
  * Clobbers the current renderbuffer binding (ctx->CurrentRenderbuffer).
  */
 struct gl_renderbuffer *
 brw_get_rb_for_slice(struct brw_context *brw,
                      struct intel_mipmap_tree *mt,
                      unsigned level, unsigned layer, bool flat)
 {
    struct gl_context *ctx = &brw->ctx;
    struct gl_renderbuffer *rb = ctx->Driver.NewRenderbuffer(ctx, 0xDEADBEEF);
    struct intel_renderbuffer *irb = intel_renderbuffer(rb);

    rb->RefCount = 1;
    rb->Format = mt->format;
    rb->_BaseFormat = _mesa_get_format_base_format(mt->format);

    /* Program takes care of msaa and mip-level access manually for stencil.
     * The surface is also treated as Y-tiled instead of as W-tiled calling for
     * twice the width and half the height in dimensions.
     */
    if (flat) {
       const unsigned halign_stencil = 8;

       rb->NumSamples = 0;
       rb->Width = ALIGN(mt->total_width, halign_stencil) * 2;
       rb->Height = (mt->total_height / mt->physical_depth0) / 2;
       irb->mt_level = 0;
    } else {
       rb->NumSamples = mt->num_samples;
       rb->Width = mt->logical_width0;
       rb->Height = mt->logical_height0;
       irb->mt_level = level;
    }

    irb->mt_layer = layer;

    intel_miptree_reference(&irb->mt, mt);

    return rb;
 }

 /**
  * Determine if fast color clear supports the given clear color.
  *
  * Fast color clear can only clear to color values of 1.0 or 0.0.  At the
  * moment we only support floating point, unorm, and snorm buffers.
  */
 bool
 brw_is_color_fast_clear_compatible(struct brw_context *brw,
                                    const struct intel_mipmap_tree *mt,
                                    const union gl_color_union *color)
 {
    const struct gl_context *ctx = &brw->ctx;

    /* If we're mapping the render format to a different format than the
     * format we use for texturing then it is a bit questionable whether it
     * should be possible to use a fast clear. Although we only actually
     * render using a renderable format, without the override workaround it
     * wouldn't be possible to have a non-renderable surface in a fast clear
     * state so the hardware probably legitimately doesn't need to support
     * this case. At least on Gen9 this really does seem to cause problems.
     */
    if (brw->gen >= 9 &&
        brw_format_for_mesa_format(mt->format) !=
        brw->render_target_format[mt->format])
       return false;

    /* Gen9 doesn't support fast clear on single-sampled SRGB buffers. When
     * GL_FRAMEBUFFER_SRGB is enabled any color renderbuffers will be
     * resolved in intel_update_state. In that case it's pointless to do a
     * fast clear because it's very likely to be immediately resolved.
     */
    if (brw->gen >= 9 &&
        mt->num_samples <= 1 &&
        ctx->Color.sRGBEnabled &&
        _mesa_get_srgb_format_linear(mt->format) != mt->format)
       return false;

    const mesa_format format = _mesa_get_render_format(ctx, mt->format);
    if (_mesa_is_format_integer_color(format)) {
       if (brw->gen >= 8) {
          perf_debug("Integer fast clear not enabled for (%s)",
                     _mesa_get_format_name(format));
       }
       return false;
    }

    for (int i = 0; i < 4; i++) {
       if (!_mesa_format_has_color_component(format, i)) {
          continue;
       }

       if (brw->gen < 9 &&
           color->f[i] != 0.0f && color->f[i] != 1.0f) {
          return false;
       }
    }
    return true;
 }

 /**
  * Convert the given color to a bitfield suitable for ORing into DWORD 7 of
  * SURFACE_STATE (DWORD 12-15 on SKL+).
  */
 union gl_color_union
 brw_meta_convert_fast_clear_color(const struct brw_context *brw,
                                   const struct intel_mipmap_tree *mt,
                                   const union gl_color_union *color)
 {
    union gl_color_union override_color = *color;

    /* The sampler doesn't look at the format of the surface when the fast
     * clear color is used so we need to implement luminance, intensity and
     * missing components manually.
     */
    switch (_mesa_get_format_base_format(mt->format)) {
    case GL_INTENSITY:
       override_color.ui[3] = override_color.ui[0];
       /* flow through */
    case GL_LUMINANCE:
    case GL_LUMINANCE_ALPHA:
       override_color.ui[1] = override_color.ui[0];
       override_color.ui[2] = override_color.ui[0];
       break;
    default:
       for (int i = 0; i < 3; i++) {
          if (!_mesa_format_has_color_component(mt->format, i))
             override_color.ui[i] = 0;
       }
       break;
    }

    if (!_mesa_format_has_color_component(mt->format, 3)) {
       if (_mesa_is_format_integer_color(mt->format))
          override_color.ui[3] = 1;
       else
          override_color.f[3] = 1.0f;
    }

    /* Handle linear to SRGB conversion */
    if (brw->ctx.Color.sRGBEnabled &&
        _mesa_get_srgb_format_linear(mt->format) != mt->format) {
       for (int i = 0; i < 3; i++) {
          override_color.f[i] =
             util_format_linear_to_srgb_float(override_color.f[i]);
       }
    }

    return override_color;
 }

 /* Returned boolean tells if the given color differs from the current. */
 bool
 brw_meta_set_fast_clear_color(struct brw_context *brw,
                               union gl_color_union *curr_color,
                               const union gl_color_union *new_color)
 {
    bool updated;

    if (brw->gen >= 9) {
       updated = memcmp(curr_color, new_color, sizeof(*curr_color));
       *curr_color = *new_color;
    } else {
       const uint32_t old_color_value = *(uint32_t *)curr_color;
       uint32_t adjusted = 0;

       for (int i = 0; i < 4; i++) {
          /* Testing for non-0 works for integer and float colors */
          if (new_color->f[i] != 0.0f) {
             adjusted |= 1 << (GEN7_SURFACE_CLEAR_COLOR_SHIFT + (3 - i));
          }
       }

       updated = (old_color_value != adjusted);
       *(uint32_t *)curr_color = adjusted;
    }

    return updated;
 }
	/*
	* Copyright © 2014 Intel Corporation
	*
	* Permission is hereby granted, free of charge, to any person obtaining a
	* copy of this software and associated documentation files (the "Software"),
	* to deal in the Software without restriction, including without limitation
	* the rights to use, copy, modify, merge, publish, distribute, sublicense,
	* and/or sell copies of the Software, and to permit persons to whom the
	* Software is furnished to do so, subject to the following conditions:
	*
	* The above copyright notice and this permission notice (including the next
	* paragraph) shall be included in all copies or substantial portions of the
	* Software.
	*
	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
	* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
	* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
	* IN THE SOFTWARE.
	*/

	#include "brw_context.h"
	#include "brw_defines.h"
	#include "intel_fbo.h"
	#include "brw_meta_util.h"
	#include "brw_state.h"
	#include "main/blend.h"
	#include "main/fbobject.h"
	#include "util/format_srgb.h"

	/**
	* Helper function for handling mirror image blits.
	*
	* If coord0 > coord1, swap them and invert the "mirror" boolean.
	*/
	static inline void
	fixup_mirroring(bool mirror, float coord0, float *coord1)
	{
	if (coord0 > coord1) {
	mirror = !mirror;
	float tmp = *coord0;
	coord0 = coord1;
	*coord1 = tmp;
	}
	}

	/**
	* Compute the number of pixels to clip for each side of a rect
	*
	* \param x0 The rect's left coordinate
	* \param y0 The rect's bottom coordinate
	* \param x1 The rect's right coordinate
	* \param y1 The rect's top coordinate
	* \param min_x The clipping region's left coordinate
	* \param min_y The clipping region's bottom coordinate
	* \param max_x The clipping region's right coordinate
	* \param max_y The clipping region's top coordinate
	* \param clipped_x0 The number of pixels to clip from the left side
	* \param clipped_y0 The number of pixels to clip from the bottom side
	* \param clipped_x1 The number of pixels to clip from the right side
	* \param clipped_y1 The number of pixels to clip from the top side
	*
	* \return false if we clip everything away, true otherwise
	*/
	static inline bool
	compute_pixels_clipped(float x0, float y0, float x1, float y1,
	float min_x, float min_y, float max_x, float max_y,
	float clipped_x0, float clipped_y0, float clipped_x1, float clipped_y1)
	{
	/* If we are going to clip everything away, stop. */
	if (!(min_x <= max_x &&
	min_y <= max_y &&
	x0 <= max_x &&
	y0 <= max_y &&
	min_x <= x1 &&
	min_y <= y1 &&
	x0 <= x1 &&
	y0 <= y1)) {
	return false;
	}

	if (x0 < min_x)
	*clipped_x0 = min_x - x0;
	else
	*clipped_x0 = 0;
	if (max_x < x1)
	*clipped_x1 = x1 - max_x;
	else
	*clipped_x1 = 0;

	if (y0 < min_y)
	*clipped_y0 = min_y - y0;
	else
	*clipped_y0 = 0;
	if (max_y < y1)
	*clipped_y1 = y1 - max_y;
	else
	*clipped_y1 = 0;

	return true;
	}

	/**
	* Clips a coordinate (left, right, top or bottom) for the src or dst rect
	* (whichever requires the largest clip) and adjusts the coordinate
	* for the other rect accordingly.
	*
	* \param mirror true if mirroring is required
	* \param src the source rect coordinate (for example srcX0)
	* \param dst0 the dst rect coordinate (for example dstX0)
	* \param dst1 the opposite dst rect coordinate (for example dstX1)
	* \param clipped_src0 number of pixels to clip from the src coordinate
	* \param clipped_dst0 number of pixels to clip from the dst coordinate
	* \param clipped_dst1 number of pixels to clip from the opposite dst coordinate
	* \param scale the src vs dst scale involved for that coordinate
	* \param isLeftOrBottom true if we are clipping the left or bottom sides
	* of the rect.
	*/
	static inline void
	clip_coordinates(bool mirror,
	float src, float dst0, float *dst1,
	float clipped_src0,
	float clipped_dst0,
	float clipped_dst1,
	float scale,
	bool isLeftOrBottom)
	{
	/* When clipping we need to add or subtract pixels from the original
	* coordinates depending on whether we are acting on the left/bottom
	* or right/top sides of the rect respectively. We assume we have to
	* add them in the code below, and multiply by -1 when we should
	* subtract.
	*/
	int mult = isLeftOrBottom ? 1 : -1;

	if (!mirror) {
	if (clipped_src0 >= clipped_dst0 * scale) {
	src += clipped_src0 mult;
	dst0 += clipped_src0 / scale mult;
	} else {
	dst0 += clipped_dst0 mult;
	src += clipped_dst0 scale * mult;
	}
	} else {
	if (clipped_src0 >= clipped_dst1 * scale) {
	src += clipped_src0 mult;
	dst1 -= clipped_src0 / scale mult;
	} else {
	dst1 -= clipped_dst1 mult;
	src += clipped_dst1 scale * mult;
	}
	}
	}

	bool
	brw_meta_mirror_clip_and_scissor(const struct gl_context *ctx,
	const struct gl_framebuffer *read_fb,
	const struct gl_framebuffer *draw_fb,
	GLfloat srcX0, GLfloat srcY0,
	GLfloat srcX1, GLfloat srcY1,
	GLfloat dstX0, GLfloat dstY0,
	GLfloat dstX1, GLfloat dstY1,
	bool mirror_x, bool mirror_y)
	{
	*mirror_x = false;
	*mirror_y = false;

	/* Detect if the blit needs to be mirrored */
	fixup_mirroring(mirror_x, srcX0, srcX1);
	fixup_mirroring(mirror_x, dstX0, dstX1);
	fixup_mirroring(mirror_y, srcY0, srcY1);
	fixup_mirroring(mirror_y, dstY0, dstY1);

	/* Compute number of pixels to clip for each side of both rects. Return
	* early if we are going to clip everything away.
	*/
	float clip_src_x0;
	float clip_src_x1;
	float clip_src_y0;
	float clip_src_y1;
	float clip_dst_x0;
	float clip_dst_x1;
	float clip_dst_y0;
	float clip_dst_y1;

	if (!compute_pixels_clipped(srcX0, srcY0, srcX1, srcY1,
	0, 0, read_fb->Width, read_fb->Height,
	&clip_src_x0, &clip_src_y0, &clip_src_x1, &clip_src_y1))
	return true;

	if (!compute_pixels_clipped(dstX0, dstY0, dstX1, dstY1,
	draw_fb->_Xmin, draw_fb->_Ymin, draw_fb->_Xmax, draw_fb->_Ymax,
	&clip_dst_x0, &clip_dst_y0, &clip_dst_x1, &clip_dst_y1))
	return true;

	/* When clipping any of the two rects we need to adjust the coordinates in
	* the other rect considering the scaling factor involved. To obtain the best
	* precision we want to make sure that we only clip once per side to avoid
	* accumulating errors due to the scaling adjustment.
	*
	* For example, if srcX0 and dstX0 need both to be clipped we want to avoid
	* the situation where we clip srcX0 first, then adjust dstX0 accordingly
	* but then we realize that the resulting dstX0 still needs to be clipped,
	* so we clip dstX0 and adjust srcX0 again. Because we are applying scaling
	* factors to adjust the coordinates in each clipping pass we lose some
	* precision and that can affect the results of the blorp blit operation
	* slightly. What we want to do here is detect the rect that we should
	* clip first for each side so that when we adjust the other rect we ensure
	* the resulting coordinate does not need to be clipped again.
	*
	* The code below implements this by comparing the number of pixels that
	* we need to clip for each side of both rects considering the scales
	* involved. For example, clip_src_x0 represents the number of pixels to be
	* clipped for the src rect's left side, so if clip_src_x0 = 5,
	* clip_dst_x0 = 4 and scaleX = 2 it means that we are clipping more from
	* the dst rect so we should clip dstX0 only and adjust srcX0. This is
	* because clipping 4 pixels in the dst is equivalent to clipping
	* 4 * 2 = 8 > 5 in the src.
	*/

	float scaleX = (float) (srcX1 - srcX0) / (dstX1 - dstX0);
	float scaleY = (float) (srcY1 - srcY0) / (dstY1 - dstY0);

	/* Clip left side */
	clip_coordinates(*mirror_x,
	srcX0, dstX0, dstX1,
	clip_src_x0, clip_dst_x0, clip_dst_x1,
	scaleX, true);

	/* Clip right side */
	clip_coordinates(*mirror_x,
	srcX1, dstX1, dstX0,
	clip_src_x1, clip_dst_x1, clip_dst_x0,
	scaleX, false);

	/* Clip bottom side */
	clip_coordinates(*mirror_y,
	srcY0, dstY0, dstY1,
	clip_src_y0, clip_dst_y0, clip_dst_y1,
	scaleY, true);

	/* Clip top side */
	clip_coordinates(*mirror_y,
	srcY1, dstY1, dstY0,
	clip_src_y1, clip_dst_y1, clip_dst_y0,
	scaleY, false);

	/* Account for the fact that in the system framebuffer, the origin is at
	* the lower left.
	*/
	if (_mesa_is_winsys_fbo(read_fb)) {
	GLint tmp = read_fb->Height - *srcY0;
	srcY0 = read_fb->Height - srcY1;
	*srcY1 = tmp;
	mirror_y = !mirror_y;
	}
	if (_mesa_is_winsys_fbo(draw_fb)) {
	GLint tmp = draw_fb->Height - *dstY0;
	dstY0 = draw_fb->Height - dstY1;
	*dstY1 = tmp;
	mirror_y = !mirror_y;
	}

	return false;
	}

	/**
	* Creates a new named renderbuffer that wraps the first slice
	* of an existing miptree.
	*
	* Clobbers the current renderbuffer binding (ctx->CurrentRenderbuffer).
	*/
	struct gl_renderbuffer *
	brw_get_rb_for_slice(struct brw_context *brw,
	struct intel_mipmap_tree *mt,
	unsigned level, unsigned layer, bool flat)
	{
	struct gl_context *ctx = &brw->ctx;
	struct gl_renderbuffer *rb = ctx->Driver.NewRenderbuffer(ctx, 0xDEADBEEF);
	struct intel_renderbuffer *irb = intel_renderbuffer(rb);

	rb->RefCount = 1;
	rb->Format = mt->format;
	rb->_BaseFormat = _mesa_get_format_base_format(mt->format);

	/* Program takes care of msaa and mip-level access manually for stencil.
	* The surface is also treated as Y-tiled instead of as W-tiled calling for
	* twice the width and half the height in dimensions.
	*/
	if (flat) {
	const unsigned halign_stencil = 8;

	rb->NumSamples = 0;
	rb->Width = ALIGN(mt->total_width, halign_stencil) * 2;
	rb->Height = (mt->total_height / mt->physical_depth0) / 2;
	irb->mt_level = 0;
	} else {
	rb->NumSamples = mt->num_samples;
	rb->Width = mt->logical_width0;
	rb->Height = mt->logical_height0;
	irb->mt_level = level;
	}

	irb->mt_layer = layer;

	intel_miptree_reference(&irb->mt, mt);

	return rb;
	}

	/**
	* Determine if fast color clear supports the given clear color.
	*
	* Fast color clear can only clear to color values of 1.0 or 0.0. At the
	* moment we only support floating point, unorm, and snorm buffers.
	*/
	bool
	brw_is_color_fast_clear_compatible(struct brw_context *brw,
	const struct intel_mipmap_tree *mt,
	const union gl_color_union *color)
	{
	const struct gl_context *ctx = &brw->ctx;

	/* If we're mapping the render format to a different format than the
	* format we use for texturing then it is a bit questionable whether it
	* should be possible to use a fast clear. Although we only actually
	* render using a renderable format, without the override workaround it
	* wouldn't be possible to have a non-renderable surface in a fast clear
	* state so the hardware probably legitimately doesn't need to support
	* this case. At least on Gen9 this really does seem to cause problems.
	*/
	if (brw->gen >= 9 &&
	brw_format_for_mesa_format(mt->format) !=
	brw->render_target_format[mt->format])
	return false;

	/* Gen9 doesn't support fast clear on single-sampled SRGB buffers. When
	* GL_FRAMEBUFFER_SRGB is enabled any color renderbuffers will be
	* resolved in intel_update_state. In that case it's pointless to do a
	* fast clear because it's very likely to be immediately resolved.
	*/
	if (brw->gen >= 9 &&
	mt->num_samples <= 1 &&
	ctx->Color.sRGBEnabled &&
	_mesa_get_srgb_format_linear(mt->format) != mt->format)
	return false;

	const mesa_format format = _mesa_get_render_format(ctx, mt->format);
	if (_mesa_is_format_integer_color(format)) {
	if (brw->gen >= 8) {
	perf_debug("Integer fast clear not enabled for (%s)",
	_mesa_get_format_name(format));
	}
	return false;
	}

	for (int i = 0; i < 4; i++) {
	if (!_mesa_format_has_color_component(format, i)) {
	continue;
	}

	if (brw->gen < 9 &&
	color->f[i] != 0.0f && color->f[i] != 1.0f) {
	return false;
	}
	}
	return true;
	}

	/**
	* Convert the given color to a bitfield suitable for ORing into DWORD 7 of
	* SURFACE_STATE (DWORD 12-15 on SKL+).
	*/
	union gl_color_union
	brw_meta_convert_fast_clear_color(const struct brw_context *brw,
	const struct intel_mipmap_tree *mt,
	const union gl_color_union *color)
	{
	union gl_color_union override_color = *color;

	/* The sampler doesn't look at the format of the surface when the fast
	* clear color is used so we need to implement luminance, intensity and
	* missing components manually.
	*/
	switch (_mesa_get_format_base_format(mt->format)) {
	case GL_INTENSITY:
	override_color.ui[3] = override_color.ui[0];
	/* flow through */
	case GL_LUMINANCE:
	case GL_LUMINANCE_ALPHA:
	override_color.ui[1] = override_color.ui[0];
	override_color.ui[2] = override_color.ui[0];
	break;
	default:
	for (int i = 0; i < 3; i++) {
	if (!_mesa_format_has_color_component(mt->format, i))
	override_color.ui[i] = 0;
	}
	break;
	}

	if (!_mesa_format_has_color_component(mt->format, 3)) {
	if (_mesa_is_format_integer_color(mt->format))
	override_color.ui[3] = 1;
	else
	override_color.f[3] = 1.0f;
	}

	/* Handle linear to SRGB conversion */
	if (brw->ctx.Color.sRGBEnabled &&
	_mesa_get_srgb_format_linear(mt->format) != mt->format) {
	for (int i = 0; i < 3; i++) {
	override_color.f[i] =
	util_format_linear_to_srgb_float(override_color.f[i]);
	}
	}

	return override_color;
	}

	/* Returned boolean tells if the given color differs from the current. */
	bool
	brw_meta_set_fast_clear_color(struct brw_context *brw,
	union gl_color_union *curr_color,
	const union gl_color_union *new_color)
	{
	bool updated;

	if (brw->gen >= 9) {
	updated = memcmp(curr_color, new_color, sizeof(*curr_color));
	curr_color = new_color;
	} else {
	const uint32_t old_color_value = (uint32_t )curr_color;
	uint32_t adjusted = 0;

	for (int i = 0; i < 4; i++) {
	/* Testing for non-0 works for integer and float colors */
	if (new_color->f[i] != 0.0f) {
	adjusted \|= 1 << (GEN7_SURFACE_CLEAR_COLOR_SHIFT + (3 - i));
	}
	}

	updated = (old_color_value != adjusted);
	(uint32_t )curr_color = adjusted;
	}

	return updated;
	}