[Intel-gfx] [PATCH 2/5] gem_stress: make it library friendly

Ben Widawsky ben at bwidawsk.net
Mon Jan 16 03:21:23 CET 2012


These are mostly just renames, and some very small refactors.

Cc: Daniel Vetter <daniel.vetter at ffwll.ch>
Signed-off-by: Ben Widawsky <ben at bwidawsk.net>
---
 lib/Makefile.am         |    5 +
 lib/gem_stress.h        |  118 ++++
 lib/gem_stress_gen6.c   |  581 ++++++++++++++++++
 lib/gem_stress_i830.c   |  354 +++++++++++
 lib/gem_stress_i915.c   |  190 ++++++
 lib/gen6_render.h       | 1553 +++++++++++++++++++++++++++++++++++++++++++++++
 lib/intel_gpu_tools.h   |    5 +
 tests/Makefile.am       |    5 -
 tests/gem_stress.c      |   23 +-
 tests/gem_stress.h      |  100 ---
 tests/gem_stress_gen6.c |  595 ------------------
 tests/gem_stress_i830.c |  354 -----------
 tests/gem_stress_i915.c |  190 ------
 tests/gen6_render.h     | 1553 -----------------------------------------------
 14 files changed, 2822 insertions(+), 2804 deletions(-)
 create mode 100644 lib/gem_stress.h
 create mode 100644 lib/gem_stress_gen6.c
 create mode 100644 lib/gem_stress_i830.c
 create mode 100644 lib/gem_stress_i915.c
 create mode 100644 lib/gen6_render.h
 delete mode 100644 tests/gem_stress.h
 delete mode 100644 tests/gem_stress_gen6.c
 delete mode 100644 tests/gem_stress_i830.c
 delete mode 100644 tests/gem_stress_i915.c
 delete mode 100644 tests/gen6_render.h

diff --git a/lib/Makefile.am b/lib/Makefile.am
index 9607fcb..6e6463a 100644
--- a/lib/Makefile.am
+++ b/lib/Makefile.am
@@ -21,5 +21,10 @@ libintel_tools_la_SOURCES = 	\
 	intel_mmio.c		\
 	intel_pci.c		\
 	intel_reg.h		\
+	gem_stress.h		\
+	gem_stress_i915.c	\
+	gem_stress_i830.c	\
+	gen6_render.h		\
+	gem_stress_gen6.c	\
 	intel_reg_map.c
 
diff --git a/lib/gem_stress.h b/lib/gem_stress.h
new file mode 100644
index 0000000..0db2229
--- /dev/null
+++ b/lib/gem_stress.h
@@ -0,0 +1,118 @@
+#ifndef _GEM_STRESS_H_
+#define _GEM_STRESS_H_
+
+#include <stdlib.h>
+#include <sys/ioctl.h>
+#include <stdio.h>
+#include <string.h>
+#include <assert.h>
+#include <fcntl.h>
+#include <inttypes.h>
+#include <errno.h>
+#include <sys/stat.h>
+#include <sys/time.h>
+#include <getopt.h>
+#include "drm.h"
+#include "i915_drm.h"
+#include "drmtest.h"
+#include "intel_bufmgr.h"
+#include "intel_batchbuffer.h"
+#include "intel_gpu_tools.h"
+
+struct scratch_buf {
+    drm_intel_bo *bo;
+    uint32_t stride;
+    uint32_t tiling;
+    uint32_t *data;
+    uint32_t *cpu_mapping;
+    unsigned num_tiles;
+};
+
+struct option_struct {
+    unsigned scratch_buf_size;
+    unsigned max_dimension;
+    unsigned num_buffers;
+    int trace_tile;
+    int no_hw;
+    int gpu_busy_load;
+    int use_render;
+    int use_blt;
+    int forced_tiling;
+    int use_cpu_maps;
+    int total_rounds;
+    int fail;
+    int tiles_per_buf;
+    int ducttape;
+    int tile_size;
+    int check_render_cpyfn;
+    int use_signal_helper;
+};
+
+extern struct option_struct options;
+extern drm_intel_bufmgr *bufmgr;
+extern struct intel_batchbuffer *batch;
+extern int drm_fd;
+extern int devid;
+
+extern int fence_storm;
+
+#define MAX_BUFS		4096
+#define SCRATCH_BUF_SIZE	(1024*1024)	/* parenthesized so the product expands safely inside larger expressions */
+#define BUSY_BUF_SIZE		(256*4096)
+#define TILE_BYTES(size)	((size)*(size)*sizeof(uint32_t))
+
+void keep_gpu_busy(void);
+
+static inline void emit_vertex_2s(int16_t x, int16_t y) /* emits one batch dword: y in bits 31:16, x in bits 15:0 */
+{
+	OUT_BATCH((uint32_t)(uint16_t)y << 16 | (uint16_t)x); /* widen first: uint16_t promotes to int, and shifting a set bit 15 into the sign bit is undefined */
+}
+
+static inline void emit_vertex(float f)
+{
+	union { float f; uint32_t ui; } u;
+	u.f = f;
+	OUT_BATCH(u.ui);
+}
+
+static inline void emit_vertex_normalized(float f, float total)
+{
+	union { float f; uint32_t ui; } u;
+	u.f = f / total;
+	OUT_BATCH(u.ui);
+}
+
+static inline unsigned buf_width(struct scratch_buf *buf)
+{
+	return buf->stride/sizeof(uint32_t);
+}
+
+static inline unsigned buf_height(struct scratch_buf *buf)
+{
+	return options.scratch_buf_size/buf->stride;
+}
+
+static inline void
+gen6_render_flush(uint32_t batch_end)
+{
+	int ret;
+
+	ret = drm_intel_bo_subdata(batch->bo, 0, 4096, batch->buffer);
+	if (ret == 0)
+		ret = drm_intel_bo_mrb_exec(batch->bo, batch_end,
+					    NULL, 0, 0, 0);
+	assert(ret == 0);
+}
+
+
+uint32_t gen6_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
+			      struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
+			      unsigned logical_tile_no);
+uint32_t gen3_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
+			      struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
+			      unsigned logical_tile_no);
+uint32_t gen2_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
+			      struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
+			      unsigned logical_tile_no);
+
+#endif
diff --git a/lib/gem_stress_gen6.c b/lib/gem_stress_gen6.c
new file mode 100644
index 0000000..e38b4f9
--- /dev/null
+++ b/lib/gem_stress_gen6.c
@@ -0,0 +1,581 @@
+#include "gem_stress.h"
+#include "gen6_render.h"
+
+#include <assert.h>
+
+#define ALIGN(x, y) (((x) + (y)-1) & ~((y)-1))
+#define VERTEX_SIZE (3*4)
+
+static const uint32_t ps_kernel_nomask_affine[][4] = {
+	{ 0x0060005a, 0x204077be, 0x000000c0, 0x008d0040 },
+	{ 0x0060005a, 0x206077be, 0x000000c0, 0x008d0080 },
+	{ 0x0060005a, 0x208077be, 0x000000d0, 0x008d0040 },
+	{ 0x0060005a, 0x20a077be, 0x000000d0, 0x008d0080 },
+	{ 0x00000201, 0x20080061, 0x00000000, 0x00000000 },
+	{ 0x00600001, 0x20200022, 0x008d0000, 0x00000000 },
+	{ 0x02800031, 0x21c01cc9, 0x00000020, 0x0a8a0001 },
+	{ 0x00600001, 0x204003be, 0x008d01c0, 0x00000000 },
+	{ 0x00600001, 0x206003be, 0x008d01e0, 0x00000000 },
+	{ 0x00600001, 0x208003be, 0x008d0200, 0x00000000 },
+	{ 0x00600001, 0x20a003be, 0x008d0220, 0x00000000 },
+	{ 0x00600001, 0x20c003be, 0x008d0240, 0x00000000 },
+	{ 0x00600001, 0x20e003be, 0x008d0260, 0x00000000 },
+	{ 0x00600001, 0x210003be, 0x008d0280, 0x00000000 },
+	{ 0x00600001, 0x212003be, 0x008d02a0, 0x00000000 },
+	{ 0x05800031, 0x24001cc8, 0x00000040, 0x90019000 },
+	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
+};
+
+static uint32_t
+batch_used(void)
+{
+	return batch->ptr - batch->buffer;
+}
+
+static uint32_t
+batch_align(uint32_t align)
+{
+	uint32_t offset = batch_used();
+	offset = ALIGN(offset, align);
+	batch->ptr = batch->buffer + offset;
+	return offset;
+}
+
+static uint32_t
+batch_round_upto(uint32_t divisor)
+{
+	uint32_t offset = batch_used();
+	offset = (offset + divisor-1) / divisor * divisor;
+	batch->ptr = batch->buffer + offset;
+	return offset;
+}
+
+static void *
+batch_alloc(uint32_t size, uint32_t align)
+{
+	uint32_t offset = batch_align(align);
+	batch->ptr += size;
+	return memset(batch->buffer + offset, 0, size);
+}
+
+static uint32_t
+batch_offset(void *ptr)
+{
+	return (uint8_t *)ptr - batch->buffer;
+}
+
+static uint32_t
+batch_copy(const void *ptr, uint32_t size, uint32_t align)
+{
+	return batch_offset(memcpy(batch_alloc(size, align), ptr, size));
+}
+
+static uint32_t
+gen6_bind_buf(struct scratch_buf *buf,
+	      uint32_t format, int is_dst)
+{
+	struct gen6_surface_state *ss;
+	uint32_t write_domain, read_domain;
+	int ret;
+
+	if (is_dst) {
+		write_domain = read_domain = I915_GEM_DOMAIN_RENDER;
+	} else {
+		write_domain = 0;
+		read_domain = I915_GEM_DOMAIN_SAMPLER;
+	}
+
+	ss = batch_alloc(sizeof(*ss), 32);
+	ss->ss0.surface_type = GEN6_SURFACE_2D;
+	ss->ss0.surface_format = format;
+
+	ss->ss0.data_return_format = GEN6_SURFACERETURNFORMAT_FLOAT32;
+	ss->ss0.color_blend = 1;
+	ss->ss1.base_addr = buf->bo->offset;
+
+	ret = drm_intel_bo_emit_reloc(batch->bo,
+				      batch_offset(ss) + 4,
+				      buf->bo, 0,
+				      read_domain, write_domain);
+	assert(ret == 0);
+
+	ss->ss2.height = buf_height(buf) - 1;
+	ss->ss2.width  = buf_width(buf) - 1;
+	ss->ss3.pitch  = buf->stride - 1;
+	ss->ss3.tiled_surface = buf->tiling != I915_TILING_NONE;
+	ss->ss3.tile_walk     = buf->tiling == I915_TILING_Y;
+
+	return batch_offset(ss);
+}
+
+static uint32_t
+gen6_bind_surfaces(struct scratch_buf *src,
+		   struct scratch_buf *dst)
+{
+	uint32_t *binding_table;
+
+	binding_table = batch_alloc(32, 32);
+
+	binding_table[0] =
+		gen6_bind_buf(dst, GEN6_SURFACEFORMAT_B8G8R8A8_UNORM, 1);
+	binding_table[1] =
+		gen6_bind_buf(src, GEN6_SURFACEFORMAT_B8G8R8A8_UNORM, 0);
+
+	return batch_offset(binding_table);
+}
+
+static void
+gen6_emit_sip(void)
+{
+	OUT_BATCH(GEN6_STATE_SIP | 0);
+	OUT_BATCH(0);
+}
+
+static void
+gen6_emit_urb(void)
+{
+	OUT_BATCH(GEN6_3DSTATE_URB | (3 - 2));
+	OUT_BATCH((1 - 1) << GEN6_3DSTATE_URB_VS_SIZE_SHIFT |
+		  24 << GEN6_3DSTATE_URB_VS_ENTRIES_SHIFT); /* at least 24 on GEN6 */
+	OUT_BATCH(0 << GEN6_3DSTATE_URB_GS_SIZE_SHIFT |
+		  0 << GEN6_3DSTATE_URB_GS_ENTRIES_SHIFT); /* no GS thread */
+}
+
+static void
+gen6_emit_state_base_address(void)
+{
+	OUT_BATCH(GEN6_STATE_BASE_ADDRESS | (10 - 2));
+	OUT_BATCH(0); /* general */
+	OUT_RELOC(batch->bo, /* surface */
+		  I915_GEM_DOMAIN_INSTRUCTION, 0,
+		  BASE_ADDRESS_MODIFY);
+	OUT_RELOC(batch->bo, /* instruction */
+		  I915_GEM_DOMAIN_INSTRUCTION, 0,
+		  BASE_ADDRESS_MODIFY);
+	OUT_BATCH(0); /* indirect */
+	OUT_RELOC(batch->bo, /* dynamic */
+		  I915_GEM_DOMAIN_INSTRUCTION, 0,
+		  BASE_ADDRESS_MODIFY);
+
+	/* upper bounds, disable */
+	OUT_BATCH(0);
+	OUT_BATCH(BASE_ADDRESS_MODIFY);
+	OUT_BATCH(0);
+	OUT_BATCH(BASE_ADDRESS_MODIFY);
+}
+
+static void
+gen6_emit_viewports(uint32_t cc_vp)
+{
+	OUT_BATCH(GEN6_3DSTATE_VIEWPORT_STATE_POINTERS |
+		  GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_CC |
+		  (4 - 2));
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(cc_vp);
+}
+
+static void
+gen6_emit_vs(void)
+{
+	/* disable VS constant buffer */
+	OUT_BATCH(GEN6_3DSTATE_CONSTANT_VS | (5 - 2));
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+
+	OUT_BATCH(GEN6_3DSTATE_VS | (6 - 2));
+	OUT_BATCH(0); /* no VS kernel */
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0); /* pass-through */
+}
+
+static void
+gen6_emit_gs(void)
+{
+	/* disable GS constant buffer */
+	OUT_BATCH(GEN6_3DSTATE_CONSTANT_GS | (5 - 2));
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+
+	OUT_BATCH(GEN6_3DSTATE_GS | (7 - 2));
+	OUT_BATCH(0); /* no GS kernel */
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0); /* pass-through */
+}
+
+static void
+gen6_emit_clip(void)
+{
+	OUT_BATCH(GEN6_3DSTATE_CLIP | (4 - 2));
+	OUT_BATCH(0);
+	OUT_BATCH(0); /* pass-through */
+	OUT_BATCH(0);
+}
+
+static void
+gen6_emit_wm_constants(void)
+{
+	/* disable WM constant buffer */
+	OUT_BATCH(GEN6_3DSTATE_CONSTANT_PS | (5 - 2));
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+}
+
+static void
+gen6_emit_null_depth_buffer(void)
+{
+	OUT_BATCH(GEN6_3DSTATE_DEPTH_BUFFER | (7 - 2));
+	OUT_BATCH(GEN6_SURFACE_NULL << GEN6_3DSTATE_DEPTH_BUFFER_TYPE_SHIFT |
+		  GEN6_DEPTHFORMAT_D32_FLOAT << GEN6_3DSTATE_DEPTH_BUFFER_FORMAT_SHIFT);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+
+	OUT_BATCH(GEN6_3DSTATE_CLEAR_PARAMS | (2 - 2));
+	OUT_BATCH(0);
+}
+
+static void
+gen6_emit_invariant(void)
+{
+	OUT_BATCH(GEN6_PIPELINE_SELECT | PIPELINE_SELECT_3D);
+
+	OUT_BATCH(GEN6_3DSTATE_MULTISAMPLE | (3 - 2));
+	OUT_BATCH(GEN6_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_CENTER |
+		  GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_1); /* 1 sample/pixel */
+	OUT_BATCH(0);
+
+	OUT_BATCH(GEN6_3DSTATE_SAMPLE_MASK | (2 - 2));
+	OUT_BATCH(1);
+}
+
+static void
+gen6_emit_cc(uint32_t blend)
+{
+	OUT_BATCH(GEN6_3DSTATE_CC_STATE_POINTERS | (4 - 2));
+	OUT_BATCH(blend | 1);
+	OUT_BATCH(1024 | 1);
+	OUT_BATCH(1024 | 1);
+}
+
+static void
+gen6_emit_sampler(uint32_t state)
+{
+	OUT_BATCH(GEN6_3DSTATE_SAMPLER_STATE_POINTERS |
+		  GEN6_3DSTATE_SAMPLER_STATE_MODIFY_PS |
+		  (4 - 2));
+	OUT_BATCH(0); /* VS */
+	OUT_BATCH(0); /* GS */
+	OUT_BATCH(state);
+}
+
+static void
+gen6_emit_sf(void)
+{
+	OUT_BATCH(GEN6_3DSTATE_SF | (20 - 2));
+	OUT_BATCH(1 << GEN6_3DSTATE_SF_NUM_OUTPUTS_SHIFT |
+		  1 << GEN6_3DSTATE_SF_URB_ENTRY_READ_LENGTH_SHIFT |
+		  1 << GEN6_3DSTATE_SF_URB_ENTRY_READ_OFFSET_SHIFT);
+	OUT_BATCH(0);
+	OUT_BATCH(GEN6_3DSTATE_SF_CULL_NONE);
+	OUT_BATCH(2 << GEN6_3DSTATE_SF_TRIFAN_PROVOKE_SHIFT); /* DW4 */
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0); /* DW9 */
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0); /* DW14 */
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+	OUT_BATCH(0); /* DW19 */
+}
+
+static void
+gen6_emit_wm(int kernel)
+{
+	OUT_BATCH(GEN6_3DSTATE_WM | (9 - 2));
+	OUT_BATCH(kernel);
+	OUT_BATCH(1 << GEN6_3DSTATE_WM_SAMPLER_COUNT_SHIFT |
+		  2 << GEN6_3DSTATE_WM_BINDING_TABLE_ENTRY_COUNT_SHIFT);
+	OUT_BATCH(0);
+	OUT_BATCH(6 << GEN6_3DSTATE_WM_DISPATCH_START_GRF_0_SHIFT); /* DW4 */
+	OUT_BATCH((40 - 1) << GEN6_3DSTATE_WM_MAX_THREADS_SHIFT |
+		  GEN6_3DSTATE_WM_DISPATCH_ENABLE |
+		  GEN6_3DSTATE_WM_16_DISPATCH_ENABLE);
+	OUT_BATCH(1 << GEN6_3DSTATE_WM_NUM_SF_OUTPUTS_SHIFT |
+		  GEN6_3DSTATE_WM_PERSPECTIVE_PIXEL_BARYCENTRIC);
+	OUT_BATCH(0);
+	OUT_BATCH(0);
+}
+
+static void
+gen6_emit_binding_table(uint32_t wm_table)
+{
+	OUT_BATCH(GEN6_3DSTATE_BINDING_TABLE_POINTERS |
+		  GEN6_3DSTATE_BINDING_TABLE_MODIFY_PS |
+		  (4 - 2));
+	OUT_BATCH(0);		/* vs */
+	OUT_BATCH(0);		/* gs */
+	OUT_BATCH(wm_table);
+}
+
+static void
+gen6_emit_drawing_rectangle(struct scratch_buf *dst)
+{
+	OUT_BATCH(GEN6_3DSTATE_DRAWING_RECTANGLE | (4 - 2));
+	OUT_BATCH(0);
+	OUT_BATCH((buf_height(dst) - 1) << 16 | (buf_width(dst) - 1));
+	OUT_BATCH(0);
+}
+
+static void
+gen6_emit_vertex_elements(void)
+{
+	/* The VUE layout
+	 *    dword 0-3: pad (0.0, 0.0, 0.0, 0.0)
+	 *    dword 4-7: position (x, y, 1.0, 1.0),
+	 *    dword 8-11: texture coordinate 0 (u0, v0, 0, 0)
+	 *
+	 * dword 4-11 are fetched from vertex buffer
+	 */
+	OUT_BATCH(GEN6_3DSTATE_VERTEX_ELEMENTS | (2 * 3 + 1 - 2));
+
+	OUT_BATCH(0 << VE0_VERTEX_BUFFER_INDEX_SHIFT | VE0_VALID |
+		  GEN6_SURFACEFORMAT_R32G32B32A32_FLOAT << VE0_FORMAT_SHIFT |
+		  0 << VE0_OFFSET_SHIFT);
+	OUT_BATCH(GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_0_SHIFT |
+		  GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_1_SHIFT |
+		  GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_2_SHIFT |
+		  GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_3_SHIFT);
+
+	/* x,y */
+	OUT_BATCH(0 << VE0_VERTEX_BUFFER_INDEX_SHIFT | VE0_VALID |
+		  GEN6_SURFACEFORMAT_R16G16_SSCALED << VE0_FORMAT_SHIFT |
+		  0 << VE0_OFFSET_SHIFT); /* offsets vb in bytes */
+	OUT_BATCH(GEN6_VFCOMPONENT_STORE_SRC << VE1_VFCOMPONENT_0_SHIFT |
+		  GEN6_VFCOMPONENT_STORE_SRC << VE1_VFCOMPONENT_1_SHIFT |
+		  GEN6_VFCOMPONENT_STORE_1_FLT << VE1_VFCOMPONENT_2_SHIFT |
+		  GEN6_VFCOMPONENT_STORE_1_FLT << VE1_VFCOMPONENT_3_SHIFT);
+
+	/* u0, v0 */
+	OUT_BATCH(0 << VE0_VERTEX_BUFFER_INDEX_SHIFT | VE0_VALID |
+		  GEN6_SURFACEFORMAT_R32G32_FLOAT << VE0_FORMAT_SHIFT |
+		  4 << VE0_OFFSET_SHIFT);	/* offset vb in bytes */
+	OUT_BATCH(GEN6_VFCOMPONENT_STORE_SRC << VE1_VFCOMPONENT_0_SHIFT |
+		  GEN6_VFCOMPONENT_STORE_SRC << VE1_VFCOMPONENT_1_SHIFT |
+		  GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_2_SHIFT |
+		  GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_3_SHIFT);
+}
+
+static uint32_t
+gen6_create_cc_viewport(void)
+{
+	struct gen6_cc_viewport *vp;
+
+	vp = batch_alloc(sizeof(*vp), 32);
+
+	vp->min_depth = -1.e35;
+	vp->max_depth = 1.e35;
+
+	return batch_offset(vp);
+}
+
+static uint32_t
+gen6_create_cc_blend(void)
+{
+	struct gen6_blend_state *blend;
+
+	blend = batch_alloc(sizeof(*blend), 64);
+
+	blend->blend0.dest_blend_factor = GEN6_BLENDFACTOR_ZERO;
+	blend->blend0.source_blend_factor = GEN6_BLENDFACTOR_ONE;
+	blend->blend0.blend_func = GEN6_BLENDFUNCTION_ADD;
+	blend->blend0.blend_enable = 1;
+
+	blend->blend1.post_blend_clamp_enable = 1;
+	blend->blend1.pre_blend_clamp_enable = 1;
+
+	return batch_offset(blend);
+}
+
+static uint32_t
+gen6_create_kernel(void)
+{
+	return batch_copy(ps_kernel_nomask_affine,
+			  sizeof(ps_kernel_nomask_affine),
+			  64);
+}
+
+static uint32_t
+gen6_create_sampler(sampler_filter_t filter,
+		   sampler_extend_t extend)
+{
+	struct gen6_sampler_state *ss;
+
+	ss = batch_alloc(sizeof(*ss), 32);
+	ss->ss0.lod_preclamp = 1;	/* GL mode */
+
+	/* We use the legacy mode to get the semantics specified by
+	 * the Render extension. */
+	ss->ss0.border_color_mode = GEN6_BORDER_COLOR_MODE_LEGACY;
+
+	switch (filter) {
+	default:
+	case SAMPLER_FILTER_NEAREST:
+		ss->ss0.min_filter = GEN6_MAPFILTER_NEAREST;
+		ss->ss0.mag_filter = GEN6_MAPFILTER_NEAREST;
+		break;
+	case SAMPLER_FILTER_BILINEAR:
+		ss->ss0.min_filter = GEN6_MAPFILTER_LINEAR;
+		ss->ss0.mag_filter = GEN6_MAPFILTER_LINEAR;
+		break;
+	}
+
+	switch (extend) {
+	default:
+	case SAMPLER_EXTEND_NONE:
+		ss->ss1.r_wrap_mode = GEN6_TEXCOORDMODE_CLAMP_BORDER;
+		ss->ss1.s_wrap_mode = GEN6_TEXCOORDMODE_CLAMP_BORDER;
+		ss->ss1.t_wrap_mode = GEN6_TEXCOORDMODE_CLAMP_BORDER;
+		break;
+	case SAMPLER_EXTEND_REPEAT:
+		ss->ss1.r_wrap_mode = GEN6_TEXCOORDMODE_WRAP;
+		ss->ss1.s_wrap_mode = GEN6_TEXCOORDMODE_WRAP;
+		ss->ss1.t_wrap_mode = GEN6_TEXCOORDMODE_WRAP;
+		break;
+	case SAMPLER_EXTEND_PAD:
+		ss->ss1.r_wrap_mode = GEN6_TEXCOORDMODE_CLAMP;
+		ss->ss1.s_wrap_mode = GEN6_TEXCOORDMODE_CLAMP;
+		ss->ss1.t_wrap_mode = GEN6_TEXCOORDMODE_CLAMP;
+		break;
+	case SAMPLER_EXTEND_REFLECT:
+		ss->ss1.r_wrap_mode = GEN6_TEXCOORDMODE_MIRROR;
+		ss->ss1.s_wrap_mode = GEN6_TEXCOORDMODE_MIRROR;
+		ss->ss1.t_wrap_mode = GEN6_TEXCOORDMODE_MIRROR;
+		break;
+	}
+
+	return batch_offset(ss);
+}
+
+static void gen6_emit_vertex_buffer(void)
+{
+	OUT_BATCH(GEN6_3DSTATE_VERTEX_BUFFERS | 3);
+	OUT_BATCH(VB0_VERTEXDATA |
+		  0 << VB0_BUFFER_INDEX_SHIFT |
+		  VERTEX_SIZE << VB0_BUFFER_PITCH_SHIFT);
+	OUT_RELOC(batch->bo, I915_GEM_DOMAIN_VERTEX, 0, 0);
+	OUT_RELOC(batch->bo, I915_GEM_DOMAIN_VERTEX, 0, batch->bo->size-1);
+	OUT_BATCH(0);
+}
+
+static uint32_t gen6_emit_primitive(void)
+{
+	uint32_t offset;
+
+	OUT_BATCH(GEN6_3DPRIMITIVE |
+		  GEN6_3DPRIMITIVE_VERTEX_SEQUENTIAL |
+		  _3DPRIM_RECTLIST << GEN6_3DPRIMITIVE_TOPOLOGY_SHIFT |
+		  0 << 9 |
+		  4);
+	OUT_BATCH(3);	/* vertex count */
+	offset = batch_used();
+	OUT_BATCH(0);	/* vertex_index */
+	OUT_BATCH(1);	/* single instance */
+	OUT_BATCH(0);	/* start instance location */
+	OUT_BATCH(0);	/* index buffer offset, ignored */
+
+	return offset;
+}
+
+uint32_t
+gen6_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
+		     struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
+		     unsigned logical_tile_no)
+{
+	uint32_t wm_state, wm_kernel, wm_table;
+	uint32_t cc_vp, cc_blend, offset;
+	uint32_t batch_end;
+
+	batch->ptr = batch->buffer + 1024;
+	batch_alloc(64, 64);
+	wm_table  = gen6_bind_surfaces(src, dst);
+	wm_kernel = gen6_create_kernel();
+	wm_state  = gen6_create_sampler(SAMPLER_FILTER_NEAREST,
+					SAMPLER_EXTEND_NONE);
+
+	cc_vp = gen6_create_cc_viewport();
+	cc_blend = gen6_create_cc_blend();
+
+	batch->ptr = batch->buffer;
+
+	gen6_emit_invariant();
+	gen6_emit_state_base_address();
+
+	gen6_emit_sip();
+	gen6_emit_urb();
+
+	gen6_emit_viewports(cc_vp);
+	gen6_emit_vs();
+	gen6_emit_gs();
+	gen6_emit_clip();
+	gen6_emit_wm_constants();
+	gen6_emit_null_depth_buffer();
+
+	gen6_emit_drawing_rectangle(dst);
+	gen6_emit_cc(cc_blend);
+	gen6_emit_sampler(wm_state);
+	gen6_emit_sf();
+	gen6_emit_wm(wm_kernel);
+	gen6_emit_vertex_elements();
+	gen6_emit_binding_table(wm_table);
+
+	gen6_emit_vertex_buffer();
+	offset = gen6_emit_primitive();
+
+	OUT_BATCH(MI_BATCH_BUFFER_END);
+	batch_end = batch_align(8);
+
+	*(uint32_t*)(batch->buffer + offset) =
+		batch_round_upto(VERTEX_SIZE)/VERTEX_SIZE;
+
+	emit_vertex_2s(dst_x + options.tile_size, dst_y + options.tile_size);
+	emit_vertex_normalized(src_x + options.tile_size, buf_width(src));
+	emit_vertex_normalized(src_y + options.tile_size, buf_height(src));
+
+	emit_vertex_2s(dst_x, dst_y + options.tile_size);
+	emit_vertex_normalized(src_x, buf_width(src));
+	emit_vertex_normalized(src_y + options.tile_size, buf_height(src));
+
+	emit_vertex_2s(dst_x, dst_y);
+	emit_vertex_normalized(src_x, buf_width(src));
+	emit_vertex_normalized(src_y, buf_height(src));
+
+	return batch_end;
+}
diff --git a/lib/gem_stress_i830.c b/lib/gem_stress_i830.c
new file mode 100644
index 0000000..23547fc
--- /dev/null
+++ b/lib/gem_stress_i830.c
@@ -0,0 +1,354 @@
+#include "i830_reg.h"
+#include "gem_stress.h"
+
+#define TB0C_LAST_STAGE	(1u << 31)	/* unsigned: 1 << 31 would shift into the sign bit of a 32-bit int */
+#define TB0C_RESULT_SCALE_1X		(0 << 29)
+#define TB0C_RESULT_SCALE_2X		(1 << 29)
+#define TB0C_RESULT_SCALE_4X		(2 << 29)
+#define TB0C_OP_MODULE			(3 << 25)
+#define TB0C_OUTPUT_WRITE_CURRENT	(0 << 24)
+#define TB0C_OUTPUT_WRITE_ACCUM		(1 << 24)
+#define TB0C_ARG3_REPLICATE_ALPHA 	(1<<23)
+#define TB0C_ARG3_INVERT		(1<<22)
+#define TB0C_ARG3_SEL_XXX
+#define TB0C_ARG2_REPLICATE_ALPHA 	(1<<17)
+#define TB0C_ARG2_INVERT		(1<<16)
+#define TB0C_ARG2_SEL_ONE		(0 << 12)
+#define TB0C_ARG2_SEL_FACTOR		(1 << 12)
+#define TB0C_ARG2_SEL_TEXEL0		(6 << 12)
+#define TB0C_ARG2_SEL_TEXEL1		(7 << 12)
+#define TB0C_ARG2_SEL_TEXEL2		(8 << 12)
+#define TB0C_ARG2_SEL_TEXEL3		(9 << 12)
+#define TB0C_ARG1_REPLICATE_ALPHA 	(1<<11)
+#define TB0C_ARG1_INVERT		(1<<10)
+#define TB0C_ARG1_SEL_ONE		(0 << 6)
+#define TB0C_ARG1_SEL_TEXEL0		(6 << 6)
+#define TB0C_ARG1_SEL_TEXEL1		(7 << 6)
+#define TB0C_ARG1_SEL_TEXEL2		(8 << 6)
+#define TB0C_ARG1_SEL_TEXEL3		(9 << 6)
+#define TB0C_ARG0_REPLICATE_ALPHA 	(1<<5)
+#define TB0C_ARG0_SEL_XXX
+
+#define TB0A_CTR_STAGE_ENABLE 		(1u<<31)	/* unsigned: 1<<31 would shift into the sign bit of a 32-bit int */
+#define TB0A_RESULT_SCALE_1X		(0 << 29)
+#define TB0A_RESULT_SCALE_2X		(1 << 29)
+#define TB0A_RESULT_SCALE_4X		(2 << 29)
+#define TB0A_OP_MODULE			(3 << 25)
+#define TB0A_OUTPUT_WRITE_CURRENT	(0<<24)
+#define TB0A_OUTPUT_WRITE_ACCUM		(1<<24)
+#define TB0A_CTR_STAGE_SEL_BITS_XXX
+#define TB0A_ARG3_SEL_XXX
+#define TB0A_ARG3_INVERT		(1<<17)
+#define TB0A_ARG2_INVERT		(1<<16)
+#define TB0A_ARG2_SEL_ONE		(0 << 12)
+#define TB0A_ARG2_SEL_TEXEL0		(6 << 12)
+#define TB0A_ARG2_SEL_TEXEL1		(7 << 12)
+#define TB0A_ARG2_SEL_TEXEL2		(8 << 12)
+#define TB0A_ARG2_SEL_TEXEL3		(9 << 12)
+#define TB0A_ARG1_INVERT		(1<<10)
+#define TB0A_ARG1_SEL_ONE		(0 << 6)
+#define TB0A_ARG1_SEL_TEXEL0		(6 << 6)
+#define TB0A_ARG1_SEL_TEXEL1		(7 << 6)
+#define TB0A_ARG1_SEL_TEXEL2		(8 << 6)
+#define TB0A_ARG1_SEL_TEXEL3		(9 << 6)
+
+uint32_t gen2_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
+			      struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
+			      unsigned logical_tile_no)
+{
+	static unsigned keep_gpu_busy_counter = 0;
+
+	/* check both edges of the fence usage */
+	if (keep_gpu_busy_counter & 1)
+		keep_gpu_busy();
+
+	/* invariant state */
+	{
+		OUT_BATCH(_3DSTATE_MAP_CUBE | MAP_UNIT(0));
+		OUT_BATCH(_3DSTATE_MAP_CUBE | MAP_UNIT(1));
+		OUT_BATCH(_3DSTATE_MAP_CUBE | MAP_UNIT(2));
+		OUT_BATCH(_3DSTATE_MAP_CUBE | MAP_UNIT(3));
+
+		OUT_BATCH(_3DSTATE_DFLT_DIFFUSE_CMD);
+		OUT_BATCH(0);
+
+		OUT_BATCH(_3DSTATE_DFLT_SPEC_CMD);
+		OUT_BATCH(0);
+
+		OUT_BATCH(_3DSTATE_DFLT_Z_CMD);
+		OUT_BATCH(0);
+
+		OUT_BATCH(_3DSTATE_FOG_MODE_CMD);
+		OUT_BATCH(FOGFUNC_ENABLE |
+			  FOG_LINEAR_CONST | FOGSRC_INDEX_Z | ENABLE_FOG_DENSITY);
+		OUT_BATCH(0);
+		OUT_BATCH(0);
+
+		OUT_BATCH(_3DSTATE_MAP_TEX_STREAM_CMD |
+			  MAP_UNIT(0) |
+			  DISABLE_TEX_STREAM_BUMP |
+			  ENABLE_TEX_STREAM_COORD_SET |
+			  TEX_STREAM_COORD_SET(0) |
+			  ENABLE_TEX_STREAM_MAP_IDX | TEX_STREAM_MAP_IDX(0));
+		OUT_BATCH(_3DSTATE_MAP_TEX_STREAM_CMD |
+			  MAP_UNIT(1) |
+			  DISABLE_TEX_STREAM_BUMP |
+			  ENABLE_TEX_STREAM_COORD_SET |
+			  TEX_STREAM_COORD_SET(1) |
+			  ENABLE_TEX_STREAM_MAP_IDX | TEX_STREAM_MAP_IDX(1));
+		OUT_BATCH(_3DSTATE_MAP_TEX_STREAM_CMD |
+			  MAP_UNIT(2) |
+			  DISABLE_TEX_STREAM_BUMP |
+			  ENABLE_TEX_STREAM_COORD_SET |
+			  TEX_STREAM_COORD_SET(2) |
+			  ENABLE_TEX_STREAM_MAP_IDX | TEX_STREAM_MAP_IDX(2));
+		OUT_BATCH(_3DSTATE_MAP_TEX_STREAM_CMD |
+			  MAP_UNIT(3) |
+			  DISABLE_TEX_STREAM_BUMP |
+			  ENABLE_TEX_STREAM_COORD_SET |
+			  TEX_STREAM_COORD_SET(3) |
+			  ENABLE_TEX_STREAM_MAP_IDX | TEX_STREAM_MAP_IDX(3));
+
+		OUT_BATCH(_3DSTATE_MAP_COORD_TRANSFORM);
+		OUT_BATCH(DISABLE_TEX_TRANSFORM | TEXTURE_SET(0));
+		OUT_BATCH(_3DSTATE_MAP_COORD_TRANSFORM);
+		OUT_BATCH(DISABLE_TEX_TRANSFORM | TEXTURE_SET(1));
+		OUT_BATCH(_3DSTATE_MAP_COORD_TRANSFORM);
+		OUT_BATCH(DISABLE_TEX_TRANSFORM | TEXTURE_SET(2));
+		OUT_BATCH(_3DSTATE_MAP_COORD_TRANSFORM);
+		OUT_BATCH(DISABLE_TEX_TRANSFORM | TEXTURE_SET(3));
+
+		OUT_BATCH(_3DSTATE_RASTER_RULES_CMD |
+			  ENABLE_POINT_RASTER_RULE |
+			  OGL_POINT_RASTER_RULE |
+			  ENABLE_LINE_STRIP_PROVOKE_VRTX |
+			  ENABLE_TRI_FAN_PROVOKE_VRTX |
+			  ENABLE_TRI_STRIP_PROVOKE_VRTX |
+			  LINE_STRIP_PROVOKE_VRTX(1) |
+			  TRI_FAN_PROVOKE_VRTX(2) | TRI_STRIP_PROVOKE_VRTX(2));
+
+		OUT_BATCH(_3DSTATE_SCISSOR_ENABLE_CMD | DISABLE_SCISSOR_RECT);
+
+		OUT_BATCH(_3DSTATE_SCISSOR_RECT_0_CMD);
+		OUT_BATCH(0);
+		OUT_BATCH(0);
+
+		OUT_BATCH(_3DSTATE_VERTEX_TRANSFORM);
+		OUT_BATCH(DISABLE_VIEWPORT_TRANSFORM | DISABLE_PERSPECTIVE_DIVIDE);
+
+		OUT_BATCH(_3DSTATE_W_STATE_CMD);
+		OUT_BATCH(MAGIC_W_STATE_DWORD1);
+		OUT_BATCH(0x3f800000 /* 1.0 in IEEE float */ );
+
+		OUT_BATCH(_3DSTATE_COLOR_FACTOR_CMD);
+		OUT_BATCH(0x80808080);	/* .5 required in alpha for GL_DOT3_RGBA_EXT */
+
+		OUT_BATCH(_3DSTATE_MAP_COORD_SETBIND_CMD);
+		OUT_BATCH(TEXBIND_SET3(TEXCOORDSRC_VTXSET_3) |
+			  TEXBIND_SET2(TEXCOORDSRC_VTXSET_2) |
+			  TEXBIND_SET1(TEXCOORDSRC_VTXSET_1) |
+			  TEXBIND_SET0(TEXCOORDSRC_VTXSET_0));
+
+		/* copy from mesa */
+		OUT_BATCH(_3DSTATE_FOG_COLOR_CMD |
+			  FOG_COLOR_RED(0) | FOG_COLOR_GREEN(0) | FOG_COLOR_BLUE(0));
+
+		OUT_BATCH(_3DSTATE_CONST_BLEND_COLOR_CMD);
+		OUT_BATCH(0);
+
+		OUT_BATCH(_3DSTATE_MODES_1_CMD |
+			  ENABLE_COLR_BLND_FUNC |
+			  BLENDFUNC_ADD |
+			  ENABLE_SRC_BLND_FACTOR |
+			  SRC_BLND_FACT(BLENDFACTOR_ONE) |
+			  ENABLE_DST_BLND_FACTOR | DST_BLND_FACT(BLENDFACTOR_ZERO));
+		OUT_BATCH(_3DSTATE_MODES_2_CMD | ENABLE_GLOBAL_DEPTH_BIAS | GLOBAL_DEPTH_BIAS(0) | ENABLE_ALPHA_TEST_FUNC | ALPHA_TEST_FUNC(0) |	/* always */
+			  ALPHA_REF_VALUE(0));
+		OUT_BATCH(_3DSTATE_MODES_3_CMD |
+			  ENABLE_DEPTH_TEST_FUNC |
+			  DEPTH_TEST_FUNC(0x2) |	/* COMPAREFUNC_LESS */
+			  ENABLE_ALPHA_SHADE_MODE |
+			  ALPHA_SHADE_MODE(SHADE_MODE_LINEAR) |
+			  ENABLE_FOG_SHADE_MODE |
+			  FOG_SHADE_MODE(SHADE_MODE_LINEAR) |
+			  ENABLE_SPEC_SHADE_MODE |
+			  SPEC_SHADE_MODE(SHADE_MODE_LINEAR) |
+			  ENABLE_COLOR_SHADE_MODE |
+			  COLOR_SHADE_MODE(SHADE_MODE_LINEAR) |
+			  ENABLE_CULL_MODE | CULLMODE_NONE);
+
+		OUT_BATCH(_3DSTATE_MODES_4_CMD |
+			  ENABLE_LOGIC_OP_FUNC |
+			  LOGIC_OP_FUNC(LOGICOP_COPY) |
+			  ENABLE_STENCIL_TEST_MASK |
+			  STENCIL_TEST_MASK(0xff) |
+			  ENABLE_STENCIL_WRITE_MASK | STENCIL_WRITE_MASK(0xff));
+
+		OUT_BATCH(_3DSTATE_STENCIL_TEST_CMD |
+			  ENABLE_STENCIL_PARMS |
+			  STENCIL_FAIL_OP(0) |	/* STENCILOP_KEEP */
+			  STENCIL_PASS_DEPTH_FAIL_OP(0) |	/* STENCILOP_KEEP */
+			  STENCIL_PASS_DEPTH_PASS_OP(0) |	/* STENCILOP_KEEP */
+			  ENABLE_STENCIL_TEST_FUNC |
+			  STENCIL_TEST_FUNC(0) |	/* COMPAREFUNC_ALWAYS */
+			  ENABLE_STENCIL_REF_VALUE |
+			  STENCIL_REF_VALUE(0));
+
+		OUT_BATCH(_3DSTATE_MODES_5_CMD |
+			  FLUSH_TEXTURE_CACHE |
+			  ENABLE_SPRITE_POINT_TEX | SPRITE_POINT_TEX_OFF |
+			  ENABLE_FIXED_LINE_WIDTH | FIXED_LINE_WIDTH(0x2) | /* 1.0 */
+			  ENABLE_FIXED_POINT_WIDTH | FIXED_POINT_WIDTH(1));
+
+		OUT_BATCH(_3DSTATE_STIPPLE);
+
+		/* Set default blend state */
+		OUT_BATCH(_3DSTATE_MAP_BLEND_OP_CMD(0) |
+			  TEXPIPE_COLOR |
+			  ENABLE_TEXOUTPUT_WRT_SEL |
+			  TEXOP_OUTPUT_CURRENT |
+			  DISABLE_TEX_CNTRL_STAGE |
+			  TEXOP_SCALE_1X |
+			  TEXOP_MODIFY_PARMS | TEXOP_LAST_STAGE | TEXBLENDOP_ARG1);
+		OUT_BATCH(_3DSTATE_MAP_BLEND_OP_CMD(0) |
+			  TEXPIPE_ALPHA |
+			  ENABLE_TEXOUTPUT_WRT_SEL |
+			  TEXOP_OUTPUT_CURRENT |
+			  TEXOP_SCALE_1X | TEXOP_MODIFY_PARMS | TEXBLENDOP_ARG1);
+		OUT_BATCH(_3DSTATE_MAP_BLEND_ARG_CMD(0) |
+			  TEXPIPE_COLOR |
+			  TEXBLEND_ARG1 |
+			  TEXBLENDARG_MODIFY_PARMS | TEXBLENDARG_DIFFUSE);
+		OUT_BATCH(_3DSTATE_MAP_BLEND_ARG_CMD(0) |
+			  TEXPIPE_ALPHA |
+			  TEXBLEND_ARG1 |
+			  TEXBLENDARG_MODIFY_PARMS | TEXBLENDARG_DIFFUSE);
+
+		OUT_BATCH(_3DSTATE_AA_CMD |
+			  AA_LINE_ECAAR_WIDTH_ENABLE |
+			  AA_LINE_ECAAR_WIDTH_1_0 |
+			  AA_LINE_REGION_WIDTH_ENABLE |
+			  AA_LINE_REGION_WIDTH_1_0 | AA_LINE_DISABLE);
+	}
+
+	/* render target state */
+	{
+		uint32_t tiling_bits = 0;
+		if (dst->tiling != I915_TILING_NONE)
+			tiling_bits = BUF_3D_TILED_SURFACE;
+		if (dst->tiling == I915_TILING_Y)
+			tiling_bits |= BUF_3D_TILE_WALK_Y;
+
+		OUT_BATCH(_3DSTATE_BUF_INFO_CMD);
+		OUT_BATCH(BUF_3D_ID_COLOR_BACK | tiling_bits |
+			  BUF_3D_PITCH(dst->stride));
+		OUT_RELOC(dst->bo, I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER, 0);
+
+		OUT_BATCH(_3DSTATE_DST_BUF_VARS_CMD);
+		OUT_BATCH(COLR_BUF_ARGB8888 |
+			  DSTORG_HORT_BIAS(0x8) |
+			  DSTORG_VERT_BIAS(0x8));
+
+		OUT_BATCH(_3DSTATE_DRAW_RECT_CMD);
+		OUT_BATCH(0);
+		OUT_BATCH(0);		/* ymin, xmin */
+		OUT_BATCH(DRAW_YMAX(buf_height(dst) - 1) |
+			  DRAW_XMAX(buf_width(dst) - 1));
+		OUT_BATCH(0);		/* yorig, xorig */
+	}
+
+	/* dynamic state */
+	{
+		OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_1 |
+			  I1_LOAD_S(2) | I1_LOAD_S(3) | I1_LOAD_S(8) | 2);
+		OUT_BATCH(1);		/* number of coordinate sets */
+		OUT_BATCH(S3_CULLMODE_NONE | S3_VERTEXHAS_XY);
+		OUT_BATCH(S8_ENABLE_COLOR_BLEND | S8_BLENDFUNC_ADD |
+			  BLENDFACTOR_ONE << S8_SRC_BLEND_FACTOR_SHIFT |
+			  BLENDFACTOR_ZERO << S8_DST_BLEND_FACTOR_SHIFT |
+			  S8_ENABLE_COLOR_BUFFER_WRITE);
+
+		OUT_BATCH(_3DSTATE_INDPT_ALPHA_BLEND_CMD | DISABLE_INDPT_ALPHA_BLEND);
+
+		OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_2 |
+			  LOAD_TEXTURE_BLEND_STAGE(0) | 1);
+		OUT_BATCH(TB0C_LAST_STAGE | TB0C_RESULT_SCALE_1X | TB0C_OP_MODULE |
+			  TB0C_OUTPUT_WRITE_CURRENT | TB0C_ARG1_SEL_TEXEL0 |
+			  TB0C_ARG2_SEL_ONE);
+		OUT_BATCH(TB0A_RESULT_SCALE_1X | TB0A_OP_MODULE |
+			  TB0A_OUTPUT_WRITE_CURRENT | TB0A_ARG1_SEL_TEXEL0 |
+			  TB0A_ARG2_SEL_ONE);
+
+		OUT_BATCH(_3DSTATE_ENABLES_1_CMD | DISABLE_LOGIC_OP |
+			  DISABLE_STENCIL_TEST | DISABLE_DEPTH_BIAS |
+			  DISABLE_SPEC_ADD | DISABLE_FOG | DISABLE_ALPHA_TEST |
+			  ENABLE_COLOR_BLEND | DISABLE_DEPTH_TEST);
+		/* We have to explicitly say we don't want write disabled */
+		OUT_BATCH(_3DSTATE_ENABLES_2_CMD | ENABLE_COLOR_MASK |
+			  DISABLE_STENCIL_WRITE | ENABLE_TEX_CACHE |
+			  DISABLE_DITHER | ENABLE_COLOR_WRITE | DISABLE_DEPTH_WRITE);
+
+		OUT_BATCH(_3DSTATE_VERTEX_FORMAT_2_CMD |
+			  TEXCOORDFMT_2D << 0);
+	}
+
+	/* sampler state */
+	{
+		uint32_t tiling_bits = 0;
+		if (src->tiling != I915_TILING_NONE)
+			tiling_bits = TM0S1_TILED_SURFACE;
+		if (src->tiling == I915_TILING_Y)
+			tiling_bits |= TM0S1_TILE_WALK;
+
+		OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_2 |
+			  LOAD_TEXTURE_MAP(0) | 4);
+		OUT_RELOC(src->bo, I915_GEM_DOMAIN_SAMPLER, 0, 0);
+		OUT_BATCH((buf_height(src) - 1) << TM0S1_HEIGHT_SHIFT |
+			  (buf_width(src) - 1) << TM0S1_WIDTH_SHIFT |
+			  MAPSURF_32BIT | MT_32BIT_ARGB8888 | tiling_bits);
+		OUT_BATCH((src->stride / 4 - 1) << TM0S2_PITCH_SHIFT | TM0S2_MAP_2D);
+		OUT_BATCH(FILTER_NEAREST << TM0S3_MAG_FILTER_SHIFT |
+			  FILTER_NEAREST << TM0S3_MIN_FILTER_SHIFT |
+			  MIPFILTER_NONE << TM0S3_MIP_FILTER_SHIFT);
+		OUT_BATCH(0);	/* default color */
+		OUT_BATCH(_3DSTATE_MAP_COORD_SET_CMD | TEXCOORD_SET(0) |
+			  ENABLE_TEXCOORD_PARAMS | TEXCOORDS_ARE_NORMAL |
+			  TEXCOORDTYPE_CARTESIAN |
+			  ENABLE_ADDR_V_CNTL | TEXCOORD_ADDR_V_MODE(TEXCOORDMODE_CLAMP_BORDER) |
+			  ENABLE_ADDR_U_CNTL | TEXCOORD_ADDR_U_MODE(TEXCOORDMODE_CLAMP_BORDER));
+		/* map texel stream */
+		OUT_BATCH(_3DSTATE_MAP_COORD_SETBIND_CMD);
+		OUT_BATCH(TEXBIND_SET0(TEXCOORDSRC_VTXSET_0) |
+			  TEXBIND_SET1(TEXCOORDSRC_KEEP) |
+			  TEXBIND_SET2(TEXCOORDSRC_KEEP) |
+			  TEXBIND_SET3(TEXCOORDSRC_KEEP));
+		OUT_BATCH(_3DSTATE_MAP_TEX_STREAM_CMD | (0 << 16) |
+			  DISABLE_TEX_STREAM_BUMP |
+			  ENABLE_TEX_STREAM_COORD_SET |
+			  TEX_STREAM_COORD_SET(0) |
+			  ENABLE_TEX_STREAM_MAP_IDX | TEX_STREAM_MAP_IDX(0));
+	}
+
+	OUT_BATCH(PRIM3D_INLINE | PRIM3D_RECTLIST | (3*4 -1));
+	emit_vertex(dst_x + options.tile_size);
+	emit_vertex(dst_y + options.tile_size);
+	emit_vertex_normalized(src_x + options.tile_size, buf_width(src));
+	emit_vertex_normalized(src_y + options.tile_size, buf_height(src));
+
+	emit_vertex(dst_x);
+	emit_vertex(dst_y + options.tile_size);
+	emit_vertex_normalized(src_x, buf_width(src));
+	emit_vertex_normalized(src_y + options.tile_size, buf_height(src));
+
+	emit_vertex(dst_x);
+	emit_vertex(dst_y);
+	emit_vertex_normalized(src_x, buf_width(src));
+	emit_vertex_normalized(src_y, buf_height(src));
+
+	if (!(keep_gpu_busy_counter & 1))
+		keep_gpu_busy();
+
+	keep_gpu_busy_counter++;
+
+	return 0;
+}
diff --git a/lib/gem_stress_i915.c b/lib/gem_stress_i915.c
new file mode 100644
index 0000000..55e9ae8
--- /dev/null
+++ b/lib/gem_stress_i915.c
@@ -0,0 +1,190 @@
+#include "i915_reg.h"
+#include "i915_3d.h"
+#include "gem_stress.h"
+
+uint32_t gen3_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
+			      struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
+			      unsigned logical_tile_no)
+{
+	static unsigned keep_gpu_busy_counter = 0;
+
+	/* check both edges of the fence usage: keep_gpu_busy() runs before the copy when the counter is odd, after it when even */
+	if (keep_gpu_busy_counter & 1)
+		keep_gpu_busy();
+
+	/* invariant state: nothing in this section depends on src or dst */
+	{
+		OUT_BATCH(_3DSTATE_AA_CMD |
+			  AA_LINE_ECAAR_WIDTH_ENABLE |
+			  AA_LINE_ECAAR_WIDTH_1_0 |
+			  AA_LINE_REGION_WIDTH_ENABLE | AA_LINE_REGION_WIDTH_1_0);
+		OUT_BATCH(_3DSTATE_INDEPENDENT_ALPHA_BLEND_CMD |
+			  IAB_MODIFY_ENABLE |
+			  IAB_MODIFY_FUNC | (BLENDFUNC_ADD << IAB_FUNC_SHIFT) |
+			  IAB_MODIFY_SRC_FACTOR | (BLENDFACT_ONE <<
+						   IAB_SRC_FACTOR_SHIFT) |
+			  IAB_MODIFY_DST_FACTOR | (BLENDFACT_ZERO <<
+						   IAB_DST_FACTOR_SHIFT));
+		OUT_BATCH(_3DSTATE_DFLT_DIFFUSE_CMD);
+		OUT_BATCH(0);
+		OUT_BATCH(_3DSTATE_DFLT_SPEC_CMD);
+		OUT_BATCH(0);
+		OUT_BATCH(_3DSTATE_DFLT_Z_CMD);
+		OUT_BATCH(0);
+		OUT_BATCH(_3DSTATE_COORD_SET_BINDINGS |
+			  CSB_TCB(0, 0) |
+			  CSB_TCB(1, 1) |
+			  CSB_TCB(2, 2) |
+			  CSB_TCB(3, 3) |
+			  CSB_TCB(4, 4) |
+			  CSB_TCB(5, 5) | CSB_TCB(6, 6) | CSB_TCB(7, 7));
+		OUT_BATCH(_3DSTATE_RASTER_RULES_CMD |
+			  ENABLE_POINT_RASTER_RULE |
+			  OGL_POINT_RASTER_RULE |
+			  ENABLE_LINE_STRIP_PROVOKE_VRTX |
+			  ENABLE_TRI_FAN_PROVOKE_VRTX |
+			  LINE_STRIP_PROVOKE_VRTX(1) |
+			  TRI_FAN_PROVOKE_VRTX(2) | ENABLE_TEXKILL_3D_4D | TEXKILL_4D);
+		OUT_BATCH(_3DSTATE_MODES_4_CMD |
+			  ENABLE_LOGIC_OP_FUNC | LOGIC_OP_FUNC(LOGICOP_COPY) |
+			  ENABLE_STENCIL_WRITE_MASK | STENCIL_WRITE_MASK(0xff) |
+			  ENABLE_STENCIL_TEST_MASK | STENCIL_TEST_MASK(0xff));
+		OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_1 | I1_LOAD_S(3) | I1_LOAD_S(4) | I1_LOAD_S(5) | 2);
+		OUT_BATCH(0x00000000);	/* S3: disable texture coordinate wrap-shortest */
+		OUT_BATCH((1 << S4_POINT_WIDTH_SHIFT) |
+			  S4_LINE_WIDTH_ONE |
+			  S4_CULLMODE_NONE |
+			  S4_VFMT_XY);
+		OUT_BATCH(0x00000000);	/* S5: stencil */
+		OUT_BATCH(_3DSTATE_SCISSOR_ENABLE_CMD | DISABLE_SCISSOR_RECT);
+		OUT_BATCH(_3DSTATE_SCISSOR_RECT_0_CMD);
+		OUT_BATCH(0);
+		OUT_BATCH(0);
+		OUT_BATCH(_3DSTATE_DEPTH_SUBRECT_DISABLE);
+		OUT_BATCH(_3DSTATE_LOAD_INDIRECT | 0);	/* disable indirect state */
+		OUT_BATCH(0);
+		OUT_BATCH(_3DSTATE_STIPPLE);
+		OUT_BATCH(0x00000000);
+		OUT_BATCH(_3DSTATE_BACKFACE_STENCIL_OPS | BFO_ENABLE_STENCIL_TWO_SIDE | 0);
+	}
+
+	/* sampler state: src is bound as the only texture map (TEX_COUNT is 1) */
+	{
+#define TEX_COUNT 1
+		uint32_t tiling_bits = 0;
+		if (src->tiling != I915_TILING_NONE)
+			tiling_bits = MS3_TILED_SURFACE;
+		if (src->tiling == I915_TILING_Y)
+			tiling_bits |= MS3_TILE_WALK;
+
+		OUT_BATCH(_3DSTATE_MAP_STATE | (3 * TEX_COUNT));
+		OUT_BATCH((1 << TEX_COUNT) - 1);
+		OUT_RELOC(src->bo, I915_GEM_DOMAIN_SAMPLER, 0, 0);
+		OUT_BATCH(MAPSURF_32BIT | MT_32BIT_ARGB8888 |
+			  tiling_bits |
+			  (buf_height(src) - 1) << MS3_HEIGHT_SHIFT |
+			  (buf_width(src) - 1) << MS3_WIDTH_SHIFT);
+		OUT_BATCH((src->stride/4-1) << MS4_PITCH_SHIFT);
+
+		OUT_BATCH(_3DSTATE_SAMPLER_STATE | (3 * TEX_COUNT));
+		OUT_BATCH((1 << TEX_COUNT) - 1);
+		OUT_BATCH(MIPFILTER_NONE << SS2_MIP_FILTER_SHIFT |
+			  FILTER_NEAREST << SS2_MAG_FILTER_SHIFT |
+			  FILTER_NEAREST << SS2_MIN_FILTER_SHIFT);
+		OUT_BATCH(TEXCOORDMODE_WRAP << SS3_TCX_ADDR_MODE_SHIFT |
+			  TEXCOORDMODE_WRAP << SS3_TCY_ADDR_MODE_SHIFT |
+			  0 << SS3_TEXTUREMAP_INDEX_SHIFT);
+		OUT_BATCH(0x00000000);
+	}
+
+	/* render target state: dst is set up as the color buffer */
+	{
+		uint32_t tiling_bits = 0;
+		if (dst->tiling != I915_TILING_NONE)
+			tiling_bits = BUF_3D_TILED_SURFACE;
+		if (dst->tiling == I915_TILING_Y)
+			tiling_bits |= BUF_3D_TILE_WALK_Y;
+
+		OUT_BATCH(_3DSTATE_BUF_INFO_CMD);
+		OUT_BATCH(BUF_3D_ID_COLOR_BACK | tiling_bits |
+			  BUF_3D_PITCH(dst->stride));
+		OUT_RELOC(dst->bo, I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER, 0);
+
+		OUT_BATCH(_3DSTATE_DST_BUF_VARS_CMD);
+		OUT_BATCH(COLR_BUF_ARGB8888 |
+			  DSTORG_HORT_BIAS(0x8) |
+			  DSTORG_VERT_BIAS(0x8));
+
+		/* draw rect is unconditional; it spans the whole of dst */
+		OUT_BATCH(_3DSTATE_DRAW_RECT_CMD);
+		OUT_BATCH(0x00000000);
+		OUT_BATCH(0x00000000);	/* ymin, xmin */
+		OUT_BATCH(DRAW_YMAX(buf_height(dst) - 1) |
+			  DRAW_XMAX(buf_width(dst) - 1));
+		/* yorig, xorig (relate to color buffer?) */
+		OUT_BATCH(0x00000000);
+	}
+
+	/* texfmt: load S1, S2 and S6 (vertex width/pitch, texcoord 0 format, blend and color write) */
+	{
+		OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_1 |
+			  I1_LOAD_S(1) | I1_LOAD_S(2) | I1_LOAD_S(6) | 2);
+		OUT_BATCH((4 << S1_VERTEX_WIDTH_SHIFT) |
+			  (4 << S1_VERTEX_PITCH_SHIFT));
+		OUT_BATCH(~S2_TEXCOORD_FMT(0, TEXCOORDFMT_NOT_PRESENT) | S2_TEXCOORD_FMT(0, TEXCOORDFMT_2D));
+		OUT_BATCH(S6_CBUF_BLEND_ENABLE | S6_COLOR_WRITE_ENABLE |
+			  BLENDFUNC_ADD << S6_CBUF_BLEND_FUNC_SHIFT |
+			  BLENDFACT_ONE << S6_CBUF_SRC_BLEND_FACT_SHIFT |
+			  BLENDFACT_ZERO << S6_CBUF_DST_BLEND_FACT_SHIFT);
+	}
+
+	/* fragment shader: two declarations followed by a single texld */
+	{
+		OUT_BATCH(_3DSTATE_PIXEL_SHADER_PROGRAM | (1 + 3*3 - 2));
+		/* decl FS_T0 */
+		OUT_BATCH(D0_DCL |
+			  REG_TYPE(FS_T0) << D0_TYPE_SHIFT |
+			  REG_NR(FS_T0) << D0_NR_SHIFT |
+			  ((REG_TYPE(FS_T0) != REG_TYPE_S) ? D0_CHANNEL_ALL : 0));
+		OUT_BATCH(0);
+		OUT_BATCH(0);
+		/* decl FS_S0 */
+		OUT_BATCH(D0_DCL |
+			  (REG_TYPE(FS_S0) << D0_TYPE_SHIFT) |
+			  (REG_NR(FS_S0) << D0_NR_SHIFT) |
+			  ((REG_TYPE(FS_S0) != REG_TYPE_S) ? D0_CHANNEL_ALL : 0));
+		OUT_BATCH(0);
+		OUT_BATCH(0);
+		/* texld(FS_OC, FS_S0, FS_T0) */
+		OUT_BATCH(T0_TEXLD |
+			  (REG_TYPE(FS_OC) << T0_DEST_TYPE_SHIFT) |
+			  (REG_NR(FS_OC) << T0_DEST_NR_SHIFT) |
+			  (REG_NR(FS_S0) << T0_SAMPLER_NR_SHIFT));
+		OUT_BATCH((REG_TYPE(FS_T0) << T1_ADDRESS_REG_TYPE_SHIFT) |
+			  (REG_NR(FS_T0) << T1_ADDRESS_REG_NR_SHIFT));
+		OUT_BATCH(0);
+	}
+
+	OUT_BATCH(PRIM3D_RECTLIST | (3*4 - 1));
+	emit_vertex(dst_x + options.tile_size);
+	emit_vertex(dst_y + options.tile_size);
+	emit_vertex(src_x + options.tile_size);
+	emit_vertex(src_y + options.tile_size);
+
+	emit_vertex(dst_x);
+	emit_vertex(dst_y + options.tile_size);
+	emit_vertex(src_x);
+	emit_vertex(src_y + options.tile_size);
+
+	emit_vertex(dst_x);
+	emit_vertex(dst_y);
+	emit_vertex(src_x);
+	emit_vertex(src_y);
+
+	if (!(keep_gpu_busy_counter & 1))
+		keep_gpu_busy();
+
+	keep_gpu_busy_counter++;
+
+	return 0;
+}
diff --git a/lib/gen6_render.h b/lib/gen6_render.h
new file mode 100644
index 0000000..2c63c9e
--- /dev/null
+++ b/lib/gen6_render.h
@@ -0,0 +1,1553 @@
+#ifndef GEN6_RENDER_H
+#define GEN6_RENDER_H
+
+#define GEN6_3D(Pipeline,Opcode,Subopcode) ((3 << 29) | \
+					   ((Pipeline) << 27) | \
+					   ((Opcode) << 24) | \
+					   ((Subopcode) << 16))
+
+#define GEN6_STATE_BASE_ADDRESS			GEN6_3D(0, 1, 1)
+#define GEN6_STATE_SIP				GEN6_3D(0, 1, 2)
+
+#define GEN6_PIPELINE_SELECT			GEN6_3D(1, 1, 4)
+
+#define GEN6_MEDIA_STATE_POINTERS		GEN6_3D(2, 0, 0)
+#define GEN6_MEDIA_OBJECT			GEN6_3D(2, 1, 0)
+
+#define GEN6_3DSTATE_BINDING_TABLE_POINTERS	GEN6_3D(3, 0, 1)
+# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_PS  (1 << 12)/* for GEN6 */
+# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_GS  (1 << 9) /* for GEN6 */
+# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_VS  (1 << 8) /* for GEN6 */
+
+#define GEN6_3DSTATE_VERTEX_BUFFERS		GEN6_3D(3, 0, 8)
+#define GEN6_3DSTATE_VERTEX_ELEMENTS		GEN6_3D(3, 0, 9)
+#define GEN6_3DSTATE_INDEX_BUFFER		GEN6_3D(3, 0, 0xa)
+#define GEN6_3DSTATE_VF_STATISTICS		GEN6_3D(3, 0, 0xb)
+
+#define GEN6_3DSTATE_DRAWING_RECTANGLE		GEN6_3D(3, 1, 0)
+#define GEN6_3DSTATE_CONSTANT_COLOR		GEN6_3D(3, 1, 1)
+#define GEN6_3DSTATE_SAMPLER_PALETTE_LOAD	GEN6_3D(3, 1, 2)
+#define GEN6_3DSTATE_CHROMA_KEY			GEN6_3D(3, 1, 4)
+#define GEN6_3DSTATE_DEPTH_BUFFER		GEN6_3D(3, 1, 5)
+# define GEN6_3DSTATE_DEPTH_BUFFER_TYPE_SHIFT	29
+# define GEN6_3DSTATE_DEPTH_BUFFER_FORMAT_SHIFT	18
+
+#define GEN6_3DSTATE_POLY_STIPPLE_OFFSET		GEN6_3D(3, 1, 6)
+#define GEN6_3DSTATE_POLY_STIPPLE_PATTERN	GEN6_3D(3, 1, 7)
+#define GEN6_3DSTATE_LINE_STIPPLE		GEN6_3D(3, 1, 8)
+#define GEN6_3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP	GEN6_3D(3, 1, 9)
+/* These two are BLC and CTG only, not BW or CL */
+#define GEN6_3DSTATE_AA_LINE_PARAMS		GEN6_3D(3, 1, 0xa)
+#define GEN6_3DSTATE_GS_SVB_INDEX		GEN6_3D(3, 1, 0xb)
+
+#define GEN6_3DPRIMITIVE				GEN6_3D(3, 3, 0)
+
+#define GEN6_3DSTATE_CLEAR_PARAMS		GEN6_3D(3, 1, 0x10)
+/* DW1 */
+# define GEN6_3DSTATE_DEPTH_CLEAR_VALID		(1 << 15)
+
+#define GEN6_3DSTATE_SAMPLER_STATE_POINTERS	GEN6_3D(3, 0, 0x02)
+# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_PS	(1 << 12)
+# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_GS	(1 << 9)
+# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_VS	(1 << 8)
+
+#define GEN6_3DSTATE_URB			GEN6_3D(3, 0, 0x05)
+/* DW1 */
+# define GEN6_3DSTATE_URB_VS_SIZE_SHIFT		16
+# define GEN6_3DSTATE_URB_VS_ENTRIES_SHIFT	0
+/* DW2 */
+# define GEN6_3DSTATE_URB_GS_ENTRIES_SHIFT	8
+# define GEN6_3DSTATE_URB_GS_SIZE_SHIFT		0
+
+#define GEN6_3DSTATE_VIEWPORT_STATE_POINTERS	GEN6_3D(3, 0, 0x0d)
+# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_CC		(1 << 12)
+# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_SF		(1 << 11)
+# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_CLIP	(1 << 10)
+
+#define GEN6_3DSTATE_CC_STATE_POINTERS		GEN6_3D(3, 0, 0x0e)
+
+#define GEN6_3DSTATE_VS				GEN6_3D(3, 0, 0x10)
+
+#define GEN6_3DSTATE_GS				GEN6_3D(3, 0, 0x11)
+/* DW4 */
+# define GEN6_3DSTATE_GS_DISPATCH_START_GRF_SHIFT	0
+
+#define GEN6_3DSTATE_CLIP			GEN6_3D(3, 0, 0x12)
+
+#define GEN6_3DSTATE_SF				GEN6_3D(3, 0, 0x13)
+/* DW1 */
+# define GEN6_3DSTATE_SF_NUM_OUTPUTS_SHIFT		22
+# define GEN6_3DSTATE_SF_URB_ENTRY_READ_LENGTH_SHIFT	11
+# define GEN6_3DSTATE_SF_URB_ENTRY_READ_OFFSET_SHIFT	4
+/* DW2 */
+/* DW3 */
+# define GEN6_3DSTATE_SF_CULL_BOTH			(0 << 29)
+# define GEN6_3DSTATE_SF_CULL_NONE			(1 << 29)
+# define GEN6_3DSTATE_SF_CULL_FRONT			(2 << 29)
+# define GEN6_3DSTATE_SF_CULL_BACK			(3 << 29)
+/* DW4 */
+# define GEN6_3DSTATE_SF_TRI_PROVOKE_SHIFT		29
+# define GEN6_3DSTATE_SF_LINE_PROVOKE_SHIFT		27
+# define GEN6_3DSTATE_SF_TRIFAN_PROVOKE_SHIFT		25
+
+#define GEN6_3DSTATE_WM				GEN6_3D(3, 0, 0x14)
+/* DW2 */
+# define GEN6_3DSTATE_WM_SAMPLER_COUNT_SHIFT			27
+# define GEN6_3DSTATE_WM_BINDING_TABLE_ENTRY_COUNT_SHIFT	18
+/* DW4 */
+# define GEN6_3DSTATE_WM_DISPATCH_START_GRF_0_SHIFT		16
+/* DW5 */
+# define GEN6_3DSTATE_WM_MAX_THREADS_SHIFT			25
+# define GEN6_3DSTATE_WM_DISPATCH_ENABLE			(1 << 19)
+# define GEN6_3DSTATE_WM_16_DISPATCH_ENABLE			(1 << 1)
+# define GEN6_3DSTATE_WM_8_DISPATCH_ENABLE			(1 << 0)
+/* DW6 */
+# define GEN6_3DSTATE_WM_NUM_SF_OUTPUTS_SHIFT			20
+# define GEN6_3DSTATE_WM_NONPERSPECTIVE_SAMPLE_BARYCENTRIC	(1 << 15)
+# define GEN6_3DSTATE_WM_NONPERSPECTIVE_CENTROID_BARYCENTRIC	(1 << 14)
+# define GEN6_3DSTATE_WM_NONPERSPECTIVE_PIXEL_BARYCENTRIC	(1 << 13)
+# define GEN6_3DSTATE_WM_PERSPECTIVE_SAMPLE_BARYCENTRIC		(1 << 12)
+# define GEN6_3DSTATE_WM_PERSPECTIVE_CENTROID_BARYCENTRIC	(1 << 11)
+# define GEN6_3DSTATE_WM_PERSPECTIVE_PIXEL_BARYCENTRIC		(1 << 10)
+
+
+#define GEN6_3DSTATE_CONSTANT_VS		GEN6_3D(3, 0, 0x15)
+#define GEN6_3DSTATE_CONSTANT_GS		GEN6_3D(3, 0, 0x16)
+#define GEN6_3DSTATE_CONSTANT_PS		GEN6_3D(3, 0, 0x17)
+
+#define GEN6_3DSTATE_SAMPLE_MASK		GEN6_3D(3, 0, 0x18)
+
+#define GEN6_3DSTATE_MULTISAMPLE		GEN6_3D(3, 1, 0x0d)
+/* DW1 */
+# define GEN6_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_CENTER		(0 << 4)
+# define GEN6_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_UPPER_LEFT	(1 << 4)
+# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_1			(0 << 1)
+# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_4			(2 << 1)
+# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_8			(3 << 1)
+
+#define PIPELINE_SELECT_3D		0
+#define PIPELINE_SELECT_MEDIA		1
+
+/* for GEN6_STATE_BASE_ADDRESS */
+#define BASE_ADDRESS_MODIFY		(1 << 0)
+
+/* for GEN6_PIPE_CONTROL */
+#define GEN6_PIPE_CONTROL_NOWRITE       (0 << 14)
+#define GEN6_PIPE_CONTROL_WRITE_QWORD   (1 << 14)
+#define GEN6_PIPE_CONTROL_WRITE_DEPTH   (2 << 14)
+#define GEN6_PIPE_CONTROL_WRITE_TIME    (3 << 14)
+#define GEN6_PIPE_CONTROL_DEPTH_STALL   (1 << 13)
+#define GEN6_PIPE_CONTROL_WC_FLUSH      (1 << 12)
+#define GEN6_PIPE_CONTROL_IS_FLUSH      (1 << 11)
+#define GEN6_PIPE_CONTROL_TC_FLUSH      (1 << 10)
+#define GEN6_PIPE_CONTROL_NOTIFY_ENABLE (1 << 8)
+#define GEN6_PIPE_CONTROL_GLOBAL_GTT    (1 << 2)
+#define GEN6_PIPE_CONTROL_LOCAL_PGTT    (0 << 2)
+#define GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH	(1 << 0)
+
+/* VERTEX_BUFFER_STATE Structure */
+#define VB0_BUFFER_INDEX_SHIFT	26
+#define VB0_VERTEXDATA			(0 << 20)
+#define VB0_INSTANCEDATA		(1 << 20)
+#define VB0_BUFFER_PITCH_SHIFT		0
+
+/* VERTEX_ELEMENT_STATE Structure */
+#define VE0_VERTEX_BUFFER_INDEX_SHIFT	26 /* for GEN6 */
+#define VE0_VALID			(1 << 25) /* for GEN6 */
+#define VE0_FORMAT_SHIFT		16
+#define VE0_OFFSET_SHIFT		0
+#define VE1_VFCOMPONENT_0_SHIFT		28
+#define VE1_VFCOMPONENT_1_SHIFT		24
+#define VE1_VFCOMPONENT_2_SHIFT		20
+#define VE1_VFCOMPONENT_3_SHIFT		16
+#define VE1_DESTINATION_ELEMENT_OFFSET_SHIFT	0
+
+/* 3DPRIMITIVE bits */
+#define GEN6_3DPRIMITIVE_VERTEX_SEQUENTIAL (0 << 15)
+#define GEN6_3DPRIMITIVE_VERTEX_RANDOM	  (1 << 15)
+/* Primitive types are in gen6_defines.h */
+#define GEN6_3DPRIMITIVE_TOPOLOGY_SHIFT	  10
+
+#define GEN6_SVG_CTL		       0x7400
+
+#define GEN6_SVG_CTL_GS_BA	       (0 << 8)
+#define GEN6_SVG_CTL_SS_BA	       (1 << 8)
+#define GEN6_SVG_CTL_IO_BA	       (2 << 8)
+#define GEN6_SVG_CTL_GS_AUB	       (3 << 8)
+#define GEN6_SVG_CTL_IO_AUB	       (4 << 8)
+#define GEN6_SVG_CTL_SIP		       (5 << 8)
+
+#define GEN6_SVG_RDATA		       0x7404
+#define GEN6_SVG_WORK_CTL	       0x7408
+
+#define GEN6_VF_CTL		       0x7500
+
+#define GEN6_VF_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
+#define GEN6_VF_CTL_SNAPSHOT_MUX_SELECT_THREADID	   (0 << 8)
+#define GEN6_VF_CTL_SNAPSHOT_MUX_SELECT_VF_DEBUG	   (1 << 8)
+#define GEN6_VF_CTL_SNAPSHOT_TYPE_VERTEX_SEQUENCE   (0 << 4)
+#define GEN6_VF_CTL_SNAPSHOT_TYPE_VERTEX_INDEX	   (1 << 4)
+#define GEN6_VF_CTL_SKIP_INITIAL_PRIMITIVES	   (1 << 3)
+#define GEN6_VF_CTL_MAX_PRIMITIVES_LIMIT_ENABLE	   (1 << 2)
+#define GEN6_VF_CTL_VERTEX_RANGE_LIMIT_ENABLE	   (1 << 1)
+#define GEN6_VF_CTL_SNAPSHOT_ENABLE	     	   (1 << 0)
+
+#define GEN6_VF_STRG_VAL		       0x7504
+#define GEN6_VF_STR_VL_OVR	       0x7508
+#define GEN6_VF_VC_OVR		       0x750c
+#define GEN6_VF_STR_PSKIP	       0x7510
+#define GEN6_VF_MAX_PRIM		       0x7514
+#define GEN6_VF_RDATA		       0x7518
+
+#define GEN6_VS_CTL		       0x7600
+#define GEN6_VS_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
+#define GEN6_VS_CTL_SNAPSHOT_MUX_VERTEX_0	   (0 << 8)
+#define GEN6_VS_CTL_SNAPSHOT_MUX_VERTEX_1	   (1 << 8)
+#define GEN6_VS_CTL_SNAPSHOT_MUX_VALID_COUNT	   (2 << 8)
+#define GEN6_VS_CTL_SNAPSHOT_MUX_VS_KERNEL_POINTER  (3 << 8)
+#define GEN6_VS_CTL_SNAPSHOT_ALL_THREADS		   (1 << 2)
+#define GEN6_VS_CTL_THREAD_SNAPSHOT_ENABLE	   (1 << 1)
+#define GEN6_VS_CTL_SNAPSHOT_ENABLE		   (1 << 0)
+
+#define GEN6_VS_STRG_VAL		       0x7604
+#define GEN6_VS_RDATA		       0x7608
+
+#define GEN6_SF_CTL		       0x7b00
+#define GEN6_SF_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_0_FF_ID	   (0 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_0_REL_COUNT (1 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_1_FF_ID	   (2 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_1_REL_COUNT (3 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_2_FF_ID	   (4 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_2_REL_COUNT (5 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_COUNT	   (6 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_SF_KERNEL_POINTER  (7 << 8)
+#define GEN6_SF_CTL_MIN_MAX_PRIMITIVE_RANGE_ENABLE  (1 << 4)
+#define GEN6_SF_CTL_DEBUG_CLIP_RECTANGLE_ENABLE	   (1 << 3)
+#define GEN6_SF_CTL_SNAPSHOT_ALL_THREADS		   (1 << 2)
+#define GEN6_SF_CTL_THREAD_SNAPSHOT_ENABLE	   (1 << 1)
+#define GEN6_SF_CTL_SNAPSHOT_ENABLE		   (1 << 0)
+
+#define GEN6_SF_STRG_VAL		       0x7b04
+#define GEN6_SF_RDATA		       0x7b18
+
+#define GEN6_WIZ_CTL		       0x7c00
+#define GEN6_WIZ_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
+#define GEN6_WIZ_CTL_SUBSPAN_INSTANCE_SHIFT	   16
+#define GEN6_WIZ_CTL_SNAPSHOT_MUX_WIZ_KERNEL_POINTER   (0 << 8)
+#define GEN6_WIZ_CTL_SNAPSHOT_MUX_SUBSPAN_INSTANCE     (1 << 8)
+#define GEN6_WIZ_CTL_SNAPSHOT_MUX_PRIMITIVE_SEQUENCE   (2 << 8)
+#define GEN6_WIZ_CTL_SINGLE_SUBSPAN_DISPATCH	      (1 << 6)
+#define GEN6_WIZ_CTL_IGNORE_COLOR_SCOREBOARD_STALLS    (1 << 5)
+#define GEN6_WIZ_CTL_ENABLE_SUBSPAN_INSTANCE_COMPARE   (1 << 4)
+#define GEN6_WIZ_CTL_USE_UPSTREAM_SNAPSHOT_FLAG	      (1 << 3)
+#define GEN6_WIZ_CTL_SNAPSHOT_ALL_THREADS	      (1 << 2)
+#define GEN6_WIZ_CTL_THREAD_SNAPSHOT_ENABLE	      (1 << 1)
+#define GEN6_WIZ_CTL_SNAPSHOT_ENABLE		      (1 << 0)
+
+#define GEN6_WIZ_STRG_VAL			      0x7c04
+#define GEN6_WIZ_RDATA				      0x7c18
+
+#define GEN6_TS_CTL		       0x7e00
+#define GEN6_TS_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
+#define GEN6_TS_CTL_SNAPSHOT_MESSAGE_ERROR	   (0 << 8)
+#define GEN6_TS_CTL_SNAPSHOT_INTERFACE_DESCRIPTOR   (3 << 8)
+#define GEN6_TS_CTL_SNAPSHOT_ALL_CHILD_THREADS	   (1 << 2)
+#define GEN6_TS_CTL_SNAPSHOT_ALL_ROOT_THREADS  	   (1 << 1)
+#define GEN6_TS_CTL_SNAPSHOT_ENABLE		   (1 << 0)
+
+#define GEN6_TS_STRG_VAL		       0x7e04
+#define GEN6_TS_RDATA		       0x7e08
+
+/* TD_CTL on gen6 is 0x7000; only fall back to 0x8000 when nothing defined it earlier, so code depending on that is not broken. */
+#ifndef GEN6_TD_CTL
+#define GEN6_TD_CTL		       0x8000
+#endif
+#define GEN6_TD_CTL_MUX_SHIFT	       8
+#define GEN6_TD_CTL_EXTERNAL_HALT_R0_DEBUG_MATCH	   (1 << 7)
+#define GEN6_TD_CTL_FORCE_EXTERNAL_HALT		   (1 << 6)
+#define GEN6_TD_CTL_EXCEPTION_MASK_OVERRIDE	   (1 << 5)
+#define GEN6_TD_CTL_FORCE_THREAD_BREAKPOINT_ENABLE  (1 << 4)
+#define GEN6_TD_CTL_BREAKPOINT_ENABLE		   (1 << 2)
+#define GEN6_TD_CTL2		       0x8004
+#define GEN6_TD_CTL2_ILLEGAL_OPCODE_EXCEPTION_OVERRIDE (1 << 28)
+#define GEN6_TD_CTL2_MASKSTACK_EXCEPTION_OVERRIDE      (1 << 26)
+#define GEN6_TD_CTL2_SOFTWARE_EXCEPTION_OVERRIDE	      (1 << 25)
+#define GEN6_TD_CTL2_ACTIVE_THREAD_LIMIT_SHIFT	      16
+#define GEN6_TD_CTL2_ACTIVE_THREAD_LIMIT_ENABLE	      (1 << 8)
+#define GEN6_TD_CTL2_THREAD_SPAWNER_EXECUTION_MASK_ENABLE (1 << 7)
+#define GEN6_TD_CTL2_WIZ_EXECUTION_MASK_ENABLE	      (1 << 6)
+#define GEN6_TD_CTL2_SF_EXECUTION_MASK_ENABLE	      (1 << 5)
+#define GEN6_TD_CTL2_CLIPPER_EXECUTION_MASK_ENABLE     (1 << 4)
+#define GEN6_TD_CTL2_GS_EXECUTION_MASK_ENABLE	      (1 << 3)
+#define GEN6_TD_CTL2_VS_EXECUTION_MASK_ENABLE	      (1 << 0)
+#define GEN6_TD_VF_VS_EMSK	       0x8008
+#define GEN6_TD_GS_EMSK		       0x800c
+#define GEN6_TD_CLIP_EMSK	       0x8010
+#define GEN6_TD_SF_EMSK		       0x8014
+#define GEN6_TD_WIZ_EMSK		       0x8018
+#define GEN6_TD_0_6_EHTRG_VAL	       0x801c
+#define GEN6_TD_0_7_EHTRG_VAL	       0x8020
+#define GEN6_TD_0_6_EHTRG_MSK           0x8024
+#define GEN6_TD_0_7_EHTRG_MSK	       0x8028
+#define GEN6_TD_RDATA		       0x802c
+#define GEN6_TD_TS_EMSK		       0x8030
+
+#define GEN6_EU_CTL		       0x8800
+#define GEN6_EU_CTL_SELECT_SHIFT	       16
+#define GEN6_EU_CTL_DATA_MUX_SHIFT      8
+#define GEN6_EU_ATT_0		       0x8810
+#define GEN6_EU_ATT_1		       0x8814
+#define GEN6_EU_ATT_DATA_0	       0x8820
+#define GEN6_EU_ATT_DATA_1	       0x8824
+#define GEN6_EU_ATT_CLR_0	       0x8830
+#define GEN6_EU_ATT_CLR_1	       0x8834
+#define GEN6_EU_RDATA		       0x8840
+
+#define GEN6_3D(Pipeline,Opcode,Subopcode) ((3 << 29) | \
+					   ((Pipeline) << 27) | \
+					   ((Opcode) << 24) | \
+					   ((Subopcode) << 16))
+
+#define GEN6_STATE_BASE_ADDRESS			GEN6_3D(0, 1, 1)
+#define GEN6_STATE_SIP				GEN6_3D(0, 1, 2)
+
+#define GEN6_PIPELINE_SELECT			GEN6_3D(1, 1, 4)
+
+#define GEN6_MEDIA_STATE_POINTERS		GEN6_3D(2, 0, 0)
+#define GEN6_MEDIA_OBJECT			GEN6_3D(2, 1, 0)
+
+#define GEN6_3DSTATE_BINDING_TABLE_POINTERS	GEN6_3D(3, 0, 1)
+# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_PS  (1 << 12)/* for GEN6 */
+# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_GS  (1 << 9) /* for GEN6 */
+# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_VS  (1 << 8) /* for GEN6 */
+
+#define GEN6_3DSTATE_VERTEX_BUFFERS		GEN6_3D(3, 0, 8)
+#define GEN6_3DSTATE_VERTEX_ELEMENTS		GEN6_3D(3, 0, 9)
+#define GEN6_3DSTATE_INDEX_BUFFER		GEN6_3D(3, 0, 0xa)
+#define GEN6_3DSTATE_VF_STATISTICS		GEN6_3D(3, 0, 0xb)
+
+#define GEN6_3DSTATE_DRAWING_RECTANGLE		GEN6_3D(3, 1, 0)
+#define GEN6_3DSTATE_CONSTANT_COLOR		GEN6_3D(3, 1, 1)
+#define GEN6_3DSTATE_SAMPLER_PALETTE_LOAD	GEN6_3D(3, 1, 2)
+#define GEN6_3DSTATE_CHROMA_KEY			GEN6_3D(3, 1, 4)
+#define GEN6_3DSTATE_DEPTH_BUFFER		GEN6_3D(3, 1, 5)
+# define GEN6_3DSTATE_DEPTH_BUFFER_TYPE_SHIFT	29
+# define GEN6_3DSTATE_DEPTH_BUFFER_FORMAT_SHIFT	18
+
+#define GEN6_3DSTATE_POLY_STIPPLE_OFFSET		GEN6_3D(3, 1, 6)
+#define GEN6_3DSTATE_POLY_STIPPLE_PATTERN	GEN6_3D(3, 1, 7)
+#define GEN6_3DSTATE_LINE_STIPPLE		GEN6_3D(3, 1, 8)
+#define GEN6_3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP	GEN6_3D(3, 1, 9)
+/* These two are BLC and CTG only, not BW or CL */
+#define GEN6_3DSTATE_AA_LINE_PARAMS		GEN6_3D(3, 1, 0xa)
+#define GEN6_3DSTATE_GS_SVB_INDEX		GEN6_3D(3, 1, 0xb)
+
+#define GEN6_PIPE_CONTROL			GEN6_3D(3, 2, 0)
+
+#define GEN6_3DPRIMITIVE				GEN6_3D(3, 3, 0)
+
+#define GEN6_3DSTATE_CLEAR_PARAMS		GEN6_3D(3, 1, 0x10)
+/* DW1 */
+# define GEN6_3DSTATE_DEPTH_CLEAR_VALID		(1 << 15)
+
+/* for GEN6+ */
+#define GEN6_3DSTATE_SAMPLER_STATE_POINTERS	GEN6_3D(3, 0, 0x02)
+# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_PS	(1 << 12)
+# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_GS	(1 << 9)
+# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_VS	(1 << 8)
+
+#define GEN6_3DSTATE_URB			GEN6_3D(3, 0, 0x05)
+/* DW1 */
+# define GEN6_3DSTATE_URB_VS_SIZE_SHIFT		16
+# define GEN6_3DSTATE_URB_VS_ENTRIES_SHIFT	0
+/* DW2 */
+# define GEN6_3DSTATE_URB_GS_ENTRIES_SHIFT	8
+# define GEN6_3DSTATE_URB_GS_SIZE_SHIFT		0
+
+#define GEN6_3DSTATE_VIEWPORT_STATE_POINTERS	GEN6_3D(3, 0, 0x0d)
+# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_CC		(1 << 12)
+# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_SF		(1 << 11)
+# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_CLIP	(1 << 10)
+
+#define GEN6_3DSTATE_CC_STATE_POINTERS		GEN6_3D(3, 0, 0x0e)
+
+#define GEN6_3DSTATE_VS				GEN6_3D(3, 0, 0x10)
+
+#define GEN6_3DSTATE_GS				GEN6_3D(3, 0, 0x11)
+/* DW4 */
+# define GEN6_3DSTATE_GS_DISPATCH_START_GRF_SHIFT	0
+
+#define GEN6_3DSTATE_CLIP			GEN6_3D(3, 0, 0x12)
+
+#define GEN6_3DSTATE_SF				GEN6_3D(3, 0, 0x13)
+/* DW1 */
+# define GEN6_3DSTATE_SF_NUM_OUTPUTS_SHIFT		22
+# define GEN6_3DSTATE_SF_URB_ENTRY_READ_LENGTH_SHIFT	11
+# define GEN6_3DSTATE_SF_URB_ENTRY_READ_OFFSET_SHIFT	4
+/* DW2 */
+/* DW3 */
+# define GEN6_3DSTATE_SF_CULL_BOTH			(0 << 29)
+# define GEN6_3DSTATE_SF_CULL_NONE			(1 << 29)
+# define GEN6_3DSTATE_SF_CULL_FRONT			(2 << 29)
+# define GEN6_3DSTATE_SF_CULL_BACK			(3 << 29)
+/* DW4 */
+# define GEN6_3DSTATE_SF_TRI_PROVOKE_SHIFT		29
+# define GEN6_3DSTATE_SF_LINE_PROVOKE_SHIFT		27
+# define GEN6_3DSTATE_SF_TRIFAN_PROVOKE_SHIFT		25
+
+
+#define GEN6_3DSTATE_WM				GEN6_3D(3, 0, 0x14)
+/* DW2 */
+# define GEN6_3DSTATE_WM_SAMPLER_COUNT_SHITF			27
+# define GEN6_3DSTATE_WM_BINDING_TABLE_ENTRY_COUNT_SHIFT	18
+/* DW4 */
+# define GEN6_3DSTATE_WM_DISPATCH_START_GRF_0_SHIFT		16
+/* DW5 */
+# define GEN6_3DSTATE_WM_MAX_THREADS_SHIFT			25
+# define GEN6_3DSTATE_WM_DISPATCH_ENABLE			(1 << 19)
+# define GEN6_3DSTATE_WM_16_DISPATCH_ENABLE			(1 << 1)
+# define GEN6_3DSTATE_WM_8_DISPATCH_ENABLE			(1 << 0)
+/* DW6 */
+# define GEN6_3DSTATE_WM_NUM_SF_OUTPUTS_SHIFT			20
+# define GEN6_3DSTATE_WM_NONPERSPECTIVE_SAMPLE_BARYCENTRIC	(1 << 15)
+# define GEN6_3DSTATE_WM_NONPERSPECTIVE_CENTROID_BARYCENTRIC	(1 << 14)
+# define GEN6_3DSTATE_WM_NONPERSPECTIVE_PIXEL_BARYCENTRIC	(1 << 13)
+# define GEN6_3DSTATE_WM_PERSPECTIVE_SAMPLE_BARYCENTRIC		(1 << 12)
+# define GEN6_3DSTATE_WM_PERSPECTIVE_CENTROID_BARYCENTRIC	(1 << 11)
+# define GEN6_3DSTATE_WM_PERSPECTIVE_PIXEL_BARYCENTRIC		(1 << 10)
+
+
+#define GEN6_3DSTATE_CONSTANT_VS		GEN6_3D(3, 0, 0x15)
+#define GEN6_3DSTATE_CONSTANT_GS          	GEN6_3D(3, 0, 0x16)
+#define GEN6_3DSTATE_CONSTANT_PS          	GEN6_3D(3, 0, 0x17)
+
+#define GEN6_3DSTATE_SAMPLE_MASK		GEN6_3D(3, 0, 0x18)
+
+#define GEN6_3DSTATE_MULTISAMPLE		GEN6_3D(3, 1, 0x0d)
+/* DW1 */
+# define GEN6_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_CENTER		(0 << 4)
+# define GEN6_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_UPPER_LEFT	(1 << 4)
+# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_1			(0 << 1)
+# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_4			(2 << 1)
+# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_8			(3 << 1)
+
+#define PIPELINE_SELECT_3D		0
+#define PIPELINE_SELECT_MEDIA		1
+
+#define UF0_CS_REALLOC			(1 << 13)
+#define UF0_VFE_REALLOC			(1 << 12)
+#define UF0_SF_REALLOC			(1 << 11)
+#define UF0_CLIP_REALLOC		(1 << 10)
+#define UF0_GS_REALLOC			(1 << 9)
+#define UF0_VS_REALLOC			(1 << 8)
+#define UF1_CLIP_FENCE_SHIFT		20
+#define UF1_GS_FENCE_SHIFT		10
+#define UF1_VS_FENCE_SHIFT		0
+#define UF2_CS_FENCE_SHIFT		20
+#define UF2_VFE_FENCE_SHIFT		10
+#define UF2_SF_FENCE_SHIFT		0
+
+/* for GEN6_STATE_BASE_ADDRESS */
+#define BASE_ADDRESS_MODIFY		(1 << 0)
+
+/* for GEN6_3DSTATE_PIPELINED_POINTERS */
+#define GEN6_GS_DISABLE		       0
+#define GEN6_GS_ENABLE		       1
+#define GEN6_CLIP_DISABLE	       0
+#define GEN6_CLIP_ENABLE		       1
+
+/* for GEN6_PIPE_CONTROL */
+#define GEN6_PIPE_CONTROL_NOWRITE       (0 << 14)
+#define GEN6_PIPE_CONTROL_WRITE_QWORD   (1 << 14)
+#define GEN6_PIPE_CONTROL_WRITE_DEPTH   (2 << 14)
+#define GEN6_PIPE_CONTROL_WRITE_TIME    (3 << 14)
+#define GEN6_PIPE_CONTROL_DEPTH_STALL   (1 << 13)
+#define GEN6_PIPE_CONTROL_WC_FLUSH      (1 << 12)
+#define GEN6_PIPE_CONTROL_IS_FLUSH      (1 << 11)
+#define GEN6_PIPE_CONTROL_TC_FLUSH      (1 << 10)
+#define GEN6_PIPE_CONTROL_NOTIFY_ENABLE (1 << 8)
+#define GEN6_PIPE_CONTROL_GLOBAL_GTT    (1 << 2)
+#define GEN6_PIPE_CONTROL_LOCAL_PGTT    (0 << 2)
+#define GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH	(1 << 0)
+
+/* 3DPRIMITIVE bits */
+#define GEN6_3DPRIMITIVE_VERTEX_SEQUENTIAL (0 << 15)
+#define GEN6_3DPRIMITIVE_VERTEX_RANDOM	  (1 << 15)
+/* Primitive types are in gen6_defines.h */
+#define GEN6_3DPRIMITIVE_TOPOLOGY_SHIFT	  10
+
+#define GEN6_SVG_CTL		       0x7400
+
+#define GEN6_SVG_CTL_GS_BA	       (0 << 8)
+#define GEN6_SVG_CTL_SS_BA	       (1 << 8)
+#define GEN6_SVG_CTL_IO_BA	       (2 << 8)
+#define GEN6_SVG_CTL_GS_AUB	       (3 << 8)
+#define GEN6_SVG_CTL_IO_AUB	       (4 << 8)
+#define GEN6_SVG_CTL_SIP		       (5 << 8)
+
+#define GEN6_SVG_RDATA		       0x7404
+#define GEN6_SVG_WORK_CTL	       0x7408
+
+#define GEN6_VF_CTL		       0x7500
+
+#define GEN6_VF_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
+#define GEN6_VF_CTL_SNAPSHOT_MUX_SELECT_THREADID	   (0 << 8)
+#define GEN6_VF_CTL_SNAPSHOT_MUX_SELECT_VF_DEBUG	   (1 << 8)
+#define GEN6_VF_CTL_SNAPSHOT_TYPE_VERTEX_SEQUENCE   (0 << 4)
+#define GEN6_VF_CTL_SNAPSHOT_TYPE_VERTEX_INDEX	   (1 << 4)
+#define GEN6_VF_CTL_SKIP_INITIAL_PRIMITIVES	   (1 << 3)
+#define GEN6_VF_CTL_MAX_PRIMITIVES_LIMIT_ENABLE	   (1 << 2)
+#define GEN6_VF_CTL_VERTEX_RANGE_LIMIT_ENABLE	   (1 << 1)
+#define GEN6_VF_CTL_SNAPSHOT_ENABLE	     	   (1 << 0)
+
+#define GEN6_VF_STRG_VAL		       0x7504
+#define GEN6_VF_STR_VL_OVR	       0x7508
+#define GEN6_VF_VC_OVR		       0x750c
+#define GEN6_VF_STR_PSKIP	       0x7510
+#define GEN6_VF_MAX_PRIM		       0x7514
+#define GEN6_VF_RDATA		       0x7518
+
+#define GEN6_VS_CTL		       0x7600
+#define GEN6_VS_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
+#define GEN6_VS_CTL_SNAPSHOT_MUX_VERTEX_0	   (0 << 8)
+#define GEN6_VS_CTL_SNAPSHOT_MUX_VERTEX_1	   (1 << 8)
+#define GEN6_VS_CTL_SNAPSHOT_MUX_VALID_COUNT	   (2 << 8)
+#define GEN6_VS_CTL_SNAPSHOT_MUX_VS_KERNEL_POINTER  (3 << 8)
+#define GEN6_VS_CTL_SNAPSHOT_ALL_THREADS		   (1 << 2)
+#define GEN6_VS_CTL_THREAD_SNAPSHOT_ENABLE	   (1 << 1)
+#define GEN6_VS_CTL_SNAPSHOT_ENABLE		   (1 << 0)
+
+#define GEN6_VS_STRG_VAL		       0x7604
+#define GEN6_VS_RDATA		       0x7608
+
+#define GEN6_SF_CTL		       0x7b00
+#define GEN6_SF_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_0_FF_ID	   (0 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_0_REL_COUNT (1 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_1_FF_ID	   (2 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_1_REL_COUNT (3 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_2_FF_ID	   (4 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_2_REL_COUNT (5 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_COUNT	   (6 << 8)
+#define GEN6_SF_CTL_SNAPSHOT_MUX_SF_KERNEL_POINTER  (7 << 8)
+#define GEN6_SF_CTL_MIN_MAX_PRIMITIVE_RANGE_ENABLE  (1 << 4)
+#define GEN6_SF_CTL_DEBUG_CLIP_RECTANGLE_ENABLE	   (1 << 3)
+#define GEN6_SF_CTL_SNAPSHOT_ALL_THREADS		   (1 << 2)
+#define GEN6_SF_CTL_THREAD_SNAPSHOT_ENABLE	   (1 << 1)
+#define GEN6_SF_CTL_SNAPSHOT_ENABLE		   (1 << 0)
+
+#define GEN6_SF_STRG_VAL		       0x7b04
+#define GEN6_SF_RDATA		       0x7b18
+
+#define GEN6_WIZ_CTL		       0x7c00
+#define GEN6_WIZ_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
+#define GEN6_WIZ_CTL_SUBSPAN_INSTANCE_SHIFT	   16
+#define GEN6_WIZ_CTL_SNAPSHOT_MUX_WIZ_KERNEL_POINTER   (0 << 8)
+#define GEN6_WIZ_CTL_SNAPSHOT_MUX_SUBSPAN_INSTANCE     (1 << 8)
+#define GEN6_WIZ_CTL_SNAPSHOT_MUX_PRIMITIVE_SEQUENCE   (2 << 8)
+#define GEN6_WIZ_CTL_SINGLE_SUBSPAN_DISPATCH	      (1 << 6)
+#define GEN6_WIZ_CTL_IGNORE_COLOR_SCOREBOARD_STALLS    (1 << 5)
+#define GEN6_WIZ_CTL_ENABLE_SUBSPAN_INSTANCE_COMPARE   (1 << 4)
+#define GEN6_WIZ_CTL_USE_UPSTREAM_SNAPSHOT_FLAG	      (1 << 3)
+#define GEN6_WIZ_CTL_SNAPSHOT_ALL_THREADS	      (1 << 2)
+#define GEN6_WIZ_CTL_THREAD_SNAPSHOT_ENABLE	      (1 << 1)
+#define GEN6_WIZ_CTL_SNAPSHOT_ENABLE		      (1 << 0)
+
+#define GEN6_WIZ_STRG_VAL			      0x7c04
+#define GEN6_WIZ_RDATA				      0x7c18
+
+#define GEN6_TS_CTL		       0x7e00
+#define GEN6_TS_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
+#define GEN6_TS_CTL_SNAPSHOT_MESSAGE_ERROR	   (0 << 8)
+#define GEN6_TS_CTL_SNAPSHOT_INTERFACE_DESCRIPTOR   (3 << 8)
+#define GEN6_TS_CTL_SNAPSHOT_ALL_CHILD_THREADS	   (1 << 2)
+#define GEN6_TS_CTL_SNAPSHOT_ALL_ROOT_THREADS  	   (1 << 1)
+#define GEN6_TS_CTL_SNAPSHOT_ENABLE		   (1 << 0)
+
+#define GEN6_TS_STRG_VAL		       0x7e04
+#define GEN6_TS_RDATA		       0x7e08
+
+/* TD_CTL on gen6 is 0x7000; only fall back to 0x8000 when nothing defined it earlier, so code depending on that is not broken. */
+#ifndef GEN6_TD_CTL
+#define GEN6_TD_CTL                   0x8000
+#endif
+#define GEN6_TD_CTL_MUX_SHIFT	       8
+#define GEN6_TD_CTL_EXTERNAL_HALT_R0_DEBUG_MATCH	   (1 << 7)
+#define GEN6_TD_CTL_FORCE_EXTERNAL_HALT		   (1 << 6)
+#define GEN6_TD_CTL_EXCEPTION_MASK_OVERRIDE	   (1 << 5)
+#define GEN6_TD_CTL_FORCE_THREAD_BREAKPOINT_ENABLE  (1 << 4)
+#define GEN6_TD_CTL_BREAKPOINT_ENABLE		   (1 << 2)
+#define GEN6_TD_CTL2		       0x8004
+#define GEN6_TD_CTL2_ILLEGAL_OPCODE_EXCEPTION_OVERRIDE (1 << 28)
+#define GEN6_TD_CTL2_MASKSTACK_EXCEPTION_OVERRIDE      (1 << 26)
+#define GEN6_TD_CTL2_SOFTWARE_EXCEPTION_OVERRIDE	      (1 << 25)
+#define GEN6_TD_CTL2_ACTIVE_THREAD_LIMIT_SHIFT	      16
+#define GEN6_TD_CTL2_ACTIVE_THREAD_LIMIT_ENABLE	      (1 << 8)
+#define GEN6_TD_CTL2_THREAD_SPAWNER_EXECUTION_MASK_ENABLE (1 << 7)
+#define GEN6_TD_CTL2_WIZ_EXECUTION_MASK_ENABLE	      (1 << 6)
+#define GEN6_TD_CTL2_SF_EXECUTION_MASK_ENABLE	      (1 << 5)
+#define GEN6_TD_CTL2_CLIPPER_EXECUTION_MASK_ENABLE     (1 << 4)
+#define GEN6_TD_CTL2_GS_EXECUTION_MASK_ENABLE	      (1 << 3)
+#define GEN6_TD_CTL2_VS_EXECUTION_MASK_ENABLE	      (1 << 0)
+#define GEN6_TD_VF_VS_EMSK	       0x8008
+#define GEN6_TD_GS_EMSK		       0x800c
+#define GEN6_TD_CLIP_EMSK	       0x8010
+#define GEN6_TD_SF_EMSK		       0x8014
+#define GEN6_TD_WIZ_EMSK		       0x8018
+#define GEN6_TD_0_6_EHTRG_VAL	       0x801c
+#define GEN6_TD_0_7_EHTRG_VAL	       0x8020
+#define GEN6_TD_0_6_EHTRG_MSK           0x8024
+#define GEN6_TD_0_7_EHTRG_MSK	       0x8028
+#define GEN6_TD_RDATA		       0x802c
+#define GEN6_TD_TS_EMSK		       0x8030
+
+#define GEN6_EU_CTL		       0x8800
+#define GEN6_EU_CTL_SELECT_SHIFT	       16
+#define GEN6_EU_CTL_DATA_MUX_SHIFT      8
+#define GEN6_EU_ATT_0		       0x8810
+#define GEN6_EU_ATT_1		       0x8814
+#define GEN6_EU_ATT_DATA_0	       0x8820
+#define GEN6_EU_ATT_DATA_1	       0x8824
+#define GEN6_EU_ATT_CLR_0	       0x8830
+#define GEN6_EU_ATT_CLR_1	       0x8834
+#define GEN6_EU_RDATA		       0x8840
+
+/* 3D state:
+ */
+#define _3DOP_3DSTATE_PIPELINED       0x0
+#define _3DOP_3DSTATE_NONPIPELINED    0x1
+#define _3DOP_3DCONTROL               0x2
+#define _3DOP_3DPRIMITIVE             0x3
+
+#define _3DSTATE_PIPELINED_POINTERS       0x00	/* first list: values 0x00-0x0B */
+#define _3DSTATE_BINDING_TABLE_POINTERS   0x01
+#define _3DSTATE_VERTEX_BUFFERS           0x08
+#define _3DSTATE_VERTEX_ELEMENTS          0x09
+#define _3DSTATE_INDEX_BUFFER             0x0A
+#define _3DSTATE_VF_STATISTICS            0x0B
+#define _3DSTATE_DRAWING_RECTANGLE            0x00	/* numbering restarts here and reuses 0x00-0x09; presumably the _3DOP_3DSTATE_NONPIPELINED set - TODO confirm */
+#define _3DSTATE_CONSTANT_COLOR               0x01
+#define _3DSTATE_SAMPLER_PALETTE_LOAD         0x02
+#define _3DSTATE_CHROMA_KEY                   0x04
+#define _3DSTATE_DEPTH_BUFFER                 0x05
+#define _3DSTATE_POLY_STIPPLE_OFFSET          0x06
+#define _3DSTATE_POLY_STIPPLE_PATTERN         0x07
+#define _3DSTATE_LINE_STIPPLE                 0x08
+#define _3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP    0x09
+#define _3DCONTROL    0x00	/* also 0x00; presumably told apart by _3DOP_3DCONTROL - TODO confirm */
+#define _3DPRIMITIVE  0x00	/* also 0x00; presumably told apart by _3DOP_3DPRIMITIVE - TODO confirm */
+
+#define _3DPRIM_POINTLIST         0x01
+#define _3DPRIM_LINELIST          0x02
+#define _3DPRIM_LINESTRIP         0x03
+#define _3DPRIM_TRILIST           0x04
+#define _3DPRIM_TRISTRIP          0x05
+#define _3DPRIM_TRIFAN            0x06
+#define _3DPRIM_QUADLIST          0x07
+#define _3DPRIM_QUADSTRIP         0x08
+#define _3DPRIM_LINELIST_ADJ      0x09
+#define _3DPRIM_LINESTRIP_ADJ     0x0A
+#define _3DPRIM_TRILIST_ADJ       0x0B
+#define _3DPRIM_TRISTRIP_ADJ      0x0C
+#define _3DPRIM_TRISTRIP_REVERSE  0x0D
+#define _3DPRIM_POLYGON           0x0E
+#define _3DPRIM_RECTLIST          0x0F
+#define _3DPRIM_LINELOOP          0x10
+#define _3DPRIM_POINTLIST_BF      0x11
+#define _3DPRIM_LINESTRIP_CONT    0x12
+#define _3DPRIM_LINESTRIP_BF      0x13
+#define _3DPRIM_LINESTRIP_CONT_BF 0x14
+#define _3DPRIM_TRIFAN_NOSTIPPLE  0x15
+
+#define _3DPRIM_VERTEXBUFFER_ACCESS_SEQUENTIAL 0
+#define _3DPRIM_VERTEXBUFFER_ACCESS_RANDOM     1
+
+#define GEN6_ANISORATIO_2     0 
+#define GEN6_ANISORATIO_4     1 
+#define GEN6_ANISORATIO_6     2 
+#define GEN6_ANISORATIO_8     3 
+#define GEN6_ANISORATIO_10    4 
+#define GEN6_ANISORATIO_12    5 
+#define GEN6_ANISORATIO_14    6 
+#define GEN6_ANISORATIO_16    7
+
+#define GEN6_BLENDFACTOR_ONE                 0x1
+#define GEN6_BLENDFACTOR_SRC_COLOR           0x2
+#define GEN6_BLENDFACTOR_SRC_ALPHA           0x3
+#define GEN6_BLENDFACTOR_DST_ALPHA           0x4
+#define GEN6_BLENDFACTOR_DST_COLOR           0x5
+#define GEN6_BLENDFACTOR_SRC_ALPHA_SATURATE  0x6
+#define GEN6_BLENDFACTOR_CONST_COLOR         0x7
+#define GEN6_BLENDFACTOR_CONST_ALPHA         0x8
+#define GEN6_BLENDFACTOR_SRC1_COLOR          0x9
+#define GEN6_BLENDFACTOR_SRC1_ALPHA          0x0A
+#define GEN6_BLENDFACTOR_ZERO                0x11
+#define GEN6_BLENDFACTOR_INV_SRC_COLOR       0x12
+#define GEN6_BLENDFACTOR_INV_SRC_ALPHA       0x13
+#define GEN6_BLENDFACTOR_INV_DST_ALPHA       0x14
+#define GEN6_BLENDFACTOR_INV_DST_COLOR       0x15
+#define GEN6_BLENDFACTOR_INV_CONST_COLOR     0x17
+#define GEN6_BLENDFACTOR_INV_CONST_ALPHA     0x18
+#define GEN6_BLENDFACTOR_INV_SRC1_COLOR      0x19
+#define GEN6_BLENDFACTOR_INV_SRC1_ALPHA      0x1A
+
+#define GEN6_BLENDFUNCTION_ADD               0
+#define GEN6_BLENDFUNCTION_SUBTRACT          1
+#define GEN6_BLENDFUNCTION_REVERSE_SUBTRACT  2
+#define GEN6_BLENDFUNCTION_MIN               3
+#define GEN6_BLENDFUNCTION_MAX               4
+
+#define GEN6_ALPHATEST_FORMAT_UNORM8         0
+#define GEN6_ALPHATEST_FORMAT_FLOAT32        1
+
+#define GEN6_CHROMAKEY_KILL_ON_ANY_MATCH  0
+#define GEN6_CHROMAKEY_REPLACE_BLACK      1
+
+#define GEN6_CLIP_API_OGL     0
+#define GEN6_CLIP_API_DX      1
+
+#define GEN6_CLIPMODE_NORMAL              0
+#define GEN6_CLIPMODE_CLIP_ALL            1
+#define GEN6_CLIPMODE_CLIP_NON_REJECTED   2
+#define GEN6_CLIPMODE_REJECT_ALL          3
+#define GEN6_CLIPMODE_ACCEPT_ALL          4
+
+#define GEN6_CLIP_NDCSPACE     0
+#define GEN6_CLIP_SCREENSPACE  1
+
+#define GEN6_COMPAREFUNCTION_ALWAYS       0
+#define GEN6_COMPAREFUNCTION_NEVER        1
+#define GEN6_COMPAREFUNCTION_LESS         2
+#define GEN6_COMPAREFUNCTION_EQUAL        3
+#define GEN6_COMPAREFUNCTION_LEQUAL       4
+#define GEN6_COMPAREFUNCTION_GREATER      5
+#define GEN6_COMPAREFUNCTION_NOTEQUAL     6
+#define GEN6_COMPAREFUNCTION_GEQUAL       7
+
+#define GEN6_COVERAGE_PIXELS_HALF     0
+#define GEN6_COVERAGE_PIXELS_1        1
+#define GEN6_COVERAGE_PIXELS_2        2
+#define GEN6_COVERAGE_PIXELS_4        3
+
+#define GEN6_CULLMODE_BOTH        0
+#define GEN6_CULLMODE_NONE        1
+#define GEN6_CULLMODE_FRONT       2
+#define GEN6_CULLMODE_BACK        3
+
+#define GEN6_DEFAULTCOLOR_R8G8B8A8_UNORM      0
+#define GEN6_DEFAULTCOLOR_R32G32B32A32_FLOAT  1
+
+#define GEN6_DEPTHFORMAT_D32_FLOAT_S8X24_UINT     0
+#define GEN6_DEPTHFORMAT_D32_FLOAT                1
+#define GEN6_DEPTHFORMAT_D24_UNORM_S8_UINT        2
+#define GEN6_DEPTHFORMAT_D16_UNORM                5
+
+#define GEN6_FLOATING_POINT_IEEE_754        0
+#define GEN6_FLOATING_POINT_NON_IEEE_754    1
+
+#define GEN6_FRONTWINDING_CW      0
+#define GEN6_FRONTWINDING_CCW     1
+
+#define GEN6_INDEX_BYTE     0
+#define GEN6_INDEX_WORD     1
+#define GEN6_INDEX_DWORD    2
+
+#define GEN6_LOGICOPFUNCTION_CLEAR            0
+#define GEN6_LOGICOPFUNCTION_NOR              1
+#define GEN6_LOGICOPFUNCTION_AND_INVERTED     2
+#define GEN6_LOGICOPFUNCTION_COPY_INVERTED    3
+#define GEN6_LOGICOPFUNCTION_AND_REVERSE      4
+#define GEN6_LOGICOPFUNCTION_INVERT           5
+#define GEN6_LOGICOPFUNCTION_XOR              6
+#define GEN6_LOGICOPFUNCTION_NAND             7
+#define GEN6_LOGICOPFUNCTION_AND              8
+#define GEN6_LOGICOPFUNCTION_EQUIV            9
+#define GEN6_LOGICOPFUNCTION_NOOP             10
+#define GEN6_LOGICOPFUNCTION_OR_INVERTED      11
+#define GEN6_LOGICOPFUNCTION_COPY             12
+#define GEN6_LOGICOPFUNCTION_OR_REVERSE       13
+#define GEN6_LOGICOPFUNCTION_OR               14
+#define GEN6_LOGICOPFUNCTION_SET              15  
+
+#define GEN6_MAPFILTER_NEAREST        0x0 
+#define GEN6_MAPFILTER_LINEAR         0x1 
+#define GEN6_MAPFILTER_ANISOTROPIC    0x2
+
+#define GEN6_MIPFILTER_NONE        0   
+#define GEN6_MIPFILTER_NEAREST     1   
+#define GEN6_MIPFILTER_LINEAR      3
+
+#define GEN6_POLYGON_FRONT_FACING     0
+#define GEN6_POLYGON_BACK_FACING      1
+
+#define GEN6_PREFILTER_ALWAYS     0x0 
+#define GEN6_PREFILTER_NEVER      0x1
+#define GEN6_PREFILTER_LESS       0x2
+#define GEN6_PREFILTER_EQUAL      0x3
+#define GEN6_PREFILTER_LEQUAL     0x4
+#define GEN6_PREFILTER_GREATER    0x5
+#define GEN6_PREFILTER_NOTEQUAL   0x6
+#define GEN6_PREFILTER_GEQUAL     0x7
+
+#define GEN6_PROVOKING_VERTEX_0    0
+#define GEN6_PROVOKING_VERTEX_1    1 
+#define GEN6_PROVOKING_VERTEX_2    2
+
+#define GEN6_RASTRULE_UPPER_LEFT  0    
+#define GEN6_RASTRULE_UPPER_RIGHT 1
+
+#define GEN6_RENDERTARGET_CLAMPRANGE_UNORM    0
+#define GEN6_RENDERTARGET_CLAMPRANGE_SNORM    1
+#define GEN6_RENDERTARGET_CLAMPRANGE_FORMAT   2
+
+#define GEN6_STENCILOP_KEEP               0
+#define GEN6_STENCILOP_ZERO               1
+#define GEN6_STENCILOP_REPLACE            2
+#define GEN6_STENCILOP_INCRSAT            3
+#define GEN6_STENCILOP_DECRSAT            4
+#define GEN6_STENCILOP_INCR               5
+#define GEN6_STENCILOP_DECR               6
+#define GEN6_STENCILOP_INVERT             7
+
+#define GEN6_SURFACE_MIPMAPLAYOUT_BELOW   0
+#define GEN6_SURFACE_MIPMAPLAYOUT_RIGHT   1
+
+#define GEN6_SURFACEFORMAT_R32G32B32A32_FLOAT             0x000
+#define GEN6_SURFACEFORMAT_R32G32B32A32_SINT              0x001
+#define GEN6_SURFACEFORMAT_R32G32B32A32_UINT              0x002
+#define GEN6_SURFACEFORMAT_R32G32B32A32_UNORM             0x003
+#define GEN6_SURFACEFORMAT_R32G32B32A32_SNORM             0x004
+#define GEN6_SURFACEFORMAT_R64G64_FLOAT                   0x005
+#define GEN6_SURFACEFORMAT_R32G32B32X32_FLOAT             0x006
+#define GEN6_SURFACEFORMAT_R32G32B32A32_SSCALED           0x007
+#define GEN6_SURFACEFORMAT_R32G32B32A32_USCALED           0x008
+#define GEN6_SURFACEFORMAT_R32G32B32_FLOAT                0x040
+#define GEN6_SURFACEFORMAT_R32G32B32_SINT                 0x041
+#define GEN6_SURFACEFORMAT_R32G32B32_UINT                 0x042
+#define GEN6_SURFACEFORMAT_R32G32B32_UNORM                0x043
+#define GEN6_SURFACEFORMAT_R32G32B32_SNORM                0x044
+#define GEN6_SURFACEFORMAT_R32G32B32_SSCALED              0x045
+#define GEN6_SURFACEFORMAT_R32G32B32_USCALED              0x046
+#define GEN6_SURFACEFORMAT_R16G16B16A16_UNORM             0x080
+#define GEN6_SURFACEFORMAT_R16G16B16A16_SNORM             0x081
+#define GEN6_SURFACEFORMAT_R16G16B16A16_SINT              0x082
+#define GEN6_SURFACEFORMAT_R16G16B16A16_UINT              0x083
+#define GEN6_SURFACEFORMAT_R16G16B16A16_FLOAT             0x084
+#define GEN6_SURFACEFORMAT_R32G32_FLOAT                   0x085
+#define GEN6_SURFACEFORMAT_R32G32_SINT                    0x086
+#define GEN6_SURFACEFORMAT_R32G32_UINT                    0x087
+#define GEN6_SURFACEFORMAT_R32_FLOAT_X8X24_TYPELESS       0x088
+#define GEN6_SURFACEFORMAT_X32_TYPELESS_G8X24_UINT        0x089
+#define GEN6_SURFACEFORMAT_L32A32_FLOAT                   0x08A
+#define GEN6_SURFACEFORMAT_R32G32_UNORM                   0x08B
+#define GEN6_SURFACEFORMAT_R32G32_SNORM                   0x08C
+#define GEN6_SURFACEFORMAT_R64_FLOAT                      0x08D
+#define GEN6_SURFACEFORMAT_R16G16B16X16_UNORM             0x08E
+#define GEN6_SURFACEFORMAT_R16G16B16X16_FLOAT             0x08F
+#define GEN6_SURFACEFORMAT_A32X32_FLOAT                   0x090
+#define GEN6_SURFACEFORMAT_L32X32_FLOAT                   0x091
+#define GEN6_SURFACEFORMAT_I32X32_FLOAT                   0x092
+#define GEN6_SURFACEFORMAT_R16G16B16A16_SSCALED           0x093
+#define GEN6_SURFACEFORMAT_R16G16B16A16_USCALED           0x094
+#define GEN6_SURFACEFORMAT_R32G32_SSCALED                 0x095
+#define GEN6_SURFACEFORMAT_R32G32_USCALED                 0x096
+#define GEN6_SURFACEFORMAT_B8G8R8A8_UNORM                 0x0C0
+#define GEN6_SURFACEFORMAT_B8G8R8A8_UNORM_SRGB            0x0C1
+#define GEN6_SURFACEFORMAT_R10G10B10A2_UNORM              0x0C2
+#define GEN6_SURFACEFORMAT_R10G10B10A2_UNORM_SRGB         0x0C3
+#define GEN6_SURFACEFORMAT_R10G10B10A2_UINT               0x0C4
+#define GEN6_SURFACEFORMAT_R10G10B10_SNORM_A2_UNORM       0x0C5
+#define GEN6_SURFACEFORMAT_R8G8B8A8_UNORM                 0x0C7
+#define GEN6_SURFACEFORMAT_R8G8B8A8_UNORM_SRGB            0x0C8
+#define GEN6_SURFACEFORMAT_R8G8B8A8_SNORM                 0x0C9
+#define GEN6_SURFACEFORMAT_R8G8B8A8_SINT                  0x0CA
+#define GEN6_SURFACEFORMAT_R8G8B8A8_UINT                  0x0CB
+#define GEN6_SURFACEFORMAT_R16G16_UNORM                   0x0CC
+#define GEN6_SURFACEFORMAT_R16G16_SNORM                   0x0CD
+#define GEN6_SURFACEFORMAT_R16G16_SINT                    0x0CE
+#define GEN6_SURFACEFORMAT_R16G16_UINT                    0x0CF
+#define GEN6_SURFACEFORMAT_R16G16_FLOAT                   0x0D0
+#define GEN6_SURFACEFORMAT_B10G10R10A2_UNORM              0x0D1
+#define GEN6_SURFACEFORMAT_B10G10R10A2_UNORM_SRGB         0x0D2
+#define GEN6_SURFACEFORMAT_R11G11B10_FLOAT                0x0D3
+#define GEN6_SURFACEFORMAT_R32_SINT                       0x0D6
+#define GEN6_SURFACEFORMAT_R32_UINT                       0x0D7
+#define GEN6_SURFACEFORMAT_R32_FLOAT                      0x0D8
+#define GEN6_SURFACEFORMAT_R24_UNORM_X8_TYPELESS          0x0D9
+#define GEN6_SURFACEFORMAT_X24_TYPELESS_G8_UINT           0x0DA
+#define GEN6_SURFACEFORMAT_L16A16_UNORM                   0x0DF
+#define GEN6_SURFACEFORMAT_I24X8_UNORM                    0x0E0
+#define GEN6_SURFACEFORMAT_L24X8_UNORM                    0x0E1
+#define GEN6_SURFACEFORMAT_A24X8_UNORM                    0x0E2
+#define GEN6_SURFACEFORMAT_I32_FLOAT                      0x0E3
+#define GEN6_SURFACEFORMAT_L32_FLOAT                      0x0E4
+#define GEN6_SURFACEFORMAT_A32_FLOAT                      0x0E5
+#define GEN6_SURFACEFORMAT_B8G8R8X8_UNORM                 0x0E9
+#define GEN6_SURFACEFORMAT_B8G8R8X8_UNORM_SRGB            0x0EA
+#define GEN6_SURFACEFORMAT_R8G8B8X8_UNORM                 0x0EB
+#define GEN6_SURFACEFORMAT_R8G8B8X8_UNORM_SRGB            0x0EC
+#define GEN6_SURFACEFORMAT_R9G9B9E5_SHAREDEXP             0x0ED
+#define GEN6_SURFACEFORMAT_B10G10R10X2_UNORM              0x0EE
+#define GEN6_SURFACEFORMAT_L16A16_FLOAT                   0x0F0
+#define GEN6_SURFACEFORMAT_R32_UNORM                      0x0F1
+#define GEN6_SURFACEFORMAT_R32_SNORM                      0x0F2
+#define GEN6_SURFACEFORMAT_R10G10B10X2_USCALED            0x0F3
+#define GEN6_SURFACEFORMAT_R8G8B8A8_SSCALED               0x0F4
+#define GEN6_SURFACEFORMAT_R8G8B8A8_USCALED               0x0F5
+#define GEN6_SURFACEFORMAT_R16G16_SSCALED                 0x0F6
+#define GEN6_SURFACEFORMAT_R16G16_USCALED                 0x0F7
+#define GEN6_SURFACEFORMAT_R32_SSCALED                    0x0F8
+#define GEN6_SURFACEFORMAT_R32_USCALED                    0x0F9
+#define GEN6_SURFACEFORMAT_B5G6R5_UNORM                   0x100
+#define GEN6_SURFACEFORMAT_B5G6R5_UNORM_SRGB              0x101
+#define GEN6_SURFACEFORMAT_B5G5R5A1_UNORM                 0x102
+#define GEN6_SURFACEFORMAT_B5G5R5A1_UNORM_SRGB            0x103
+#define GEN6_SURFACEFORMAT_B4G4R4A4_UNORM                 0x104
+#define GEN6_SURFACEFORMAT_B4G4R4A4_UNORM_SRGB            0x105
+#define GEN6_SURFACEFORMAT_R8G8_UNORM                     0x106
+#define GEN6_SURFACEFORMAT_R8G8_SNORM                     0x107
+#define GEN6_SURFACEFORMAT_R8G8_SINT                      0x108
+#define GEN6_SURFACEFORMAT_R8G8_UINT                      0x109
+#define GEN6_SURFACEFORMAT_R16_UNORM                      0x10A
+#define GEN6_SURFACEFORMAT_R16_SNORM                      0x10B
+#define GEN6_SURFACEFORMAT_R16_SINT                       0x10C
+#define GEN6_SURFACEFORMAT_R16_UINT                       0x10D
+#define GEN6_SURFACEFORMAT_R16_FLOAT                      0x10E
+#define GEN6_SURFACEFORMAT_I16_UNORM                      0x111
+#define GEN6_SURFACEFORMAT_L16_UNORM                      0x112
+#define GEN6_SURFACEFORMAT_A16_UNORM                      0x113
+#define GEN6_SURFACEFORMAT_L8A8_UNORM                     0x114
+#define GEN6_SURFACEFORMAT_I16_FLOAT                      0x115
+#define GEN6_SURFACEFORMAT_L16_FLOAT                      0x116
+#define GEN6_SURFACEFORMAT_A16_FLOAT                      0x117
+#define GEN6_SURFACEFORMAT_R5G5_SNORM_B6_UNORM            0x119
+#define GEN6_SURFACEFORMAT_B5G5R5X1_UNORM                 0x11A
+#define GEN6_SURFACEFORMAT_B5G5R5X1_UNORM_SRGB            0x11B
+#define GEN6_SURFACEFORMAT_R8G8_SSCALED                   0x11C
+#define GEN6_SURFACEFORMAT_R8G8_USCALED                   0x11D
+#define GEN6_SURFACEFORMAT_R16_SSCALED                    0x11E
+#define GEN6_SURFACEFORMAT_R16_USCALED                    0x11F
+#define GEN6_SURFACEFORMAT_R8_UNORM                       0x140
+#define GEN6_SURFACEFORMAT_R8_SNORM                       0x141
+#define GEN6_SURFACEFORMAT_R8_SINT                        0x142
+#define GEN6_SURFACEFORMAT_R8_UINT                        0x143
+#define GEN6_SURFACEFORMAT_A8_UNORM                       0x144
+#define GEN6_SURFACEFORMAT_I8_UNORM                       0x145
+#define GEN6_SURFACEFORMAT_L8_UNORM                       0x146
+#define GEN6_SURFACEFORMAT_P4A4_UNORM                     0x147
+#define GEN6_SURFACEFORMAT_A4P4_UNORM                     0x148
+#define GEN6_SURFACEFORMAT_R8_SSCALED                     0x149
+#define GEN6_SURFACEFORMAT_R8_USCALED                     0x14A
+#define GEN6_SURFACEFORMAT_R1_UINT                        0x181
+#define GEN6_SURFACEFORMAT_YCRCB_NORMAL                   0x182
+#define GEN6_SURFACEFORMAT_YCRCB_SWAPUVY                  0x183
+#define GEN6_SURFACEFORMAT_BC1_UNORM                      0x186
+#define GEN6_SURFACEFORMAT_BC2_UNORM                      0x187
+#define GEN6_SURFACEFORMAT_BC3_UNORM                      0x188
+#define GEN6_SURFACEFORMAT_BC4_UNORM                      0x189
+#define GEN6_SURFACEFORMAT_BC5_UNORM                      0x18A
+#define GEN6_SURFACEFORMAT_BC1_UNORM_SRGB                 0x18B
+#define GEN6_SURFACEFORMAT_BC2_UNORM_SRGB                 0x18C
+#define GEN6_SURFACEFORMAT_BC3_UNORM_SRGB                 0x18D
+#define GEN6_SURFACEFORMAT_MONO8                          0x18E
+#define GEN6_SURFACEFORMAT_YCRCB_SWAPUV                   0x18F
+#define GEN6_SURFACEFORMAT_YCRCB_SWAPY                    0x190
+#define GEN6_SURFACEFORMAT_DXT1_RGB                       0x191
+#define GEN6_SURFACEFORMAT_FXT1                           0x192
+#define GEN6_SURFACEFORMAT_R8G8B8_UNORM                   0x193
+#define GEN6_SURFACEFORMAT_R8G8B8_SNORM                   0x194
+#define GEN6_SURFACEFORMAT_R8G8B8_SSCALED                 0x195
+#define GEN6_SURFACEFORMAT_R8G8B8_USCALED                 0x196
+#define GEN6_SURFACEFORMAT_R64G64B64A64_FLOAT             0x197
+#define GEN6_SURFACEFORMAT_R64G64B64_FLOAT                0x198
+#define GEN6_SURFACEFORMAT_BC4_SNORM                      0x199
+#define GEN6_SURFACEFORMAT_BC5_SNORM                      0x19A
+#define GEN6_SURFACEFORMAT_R16G16B16_UNORM                0x19C
+#define GEN6_SURFACEFORMAT_R16G16B16_SNORM                0x19D
+#define GEN6_SURFACEFORMAT_R16G16B16_SSCALED              0x19E
+#define GEN6_SURFACEFORMAT_R16G16B16_USCALED              0x19F
+
+#define GEN6_SURFACERETURNFORMAT_FLOAT32  0
+#define GEN6_SURFACERETURNFORMAT_S1       1
+
+#define GEN6_SURFACE_1D      0
+#define GEN6_SURFACE_2D      1
+#define GEN6_SURFACE_3D      2
+#define GEN6_SURFACE_CUBE    3
+#define GEN6_SURFACE_BUFFER  4
+#define GEN6_SURFACE_NULL    7
+
+#define GEN6_BORDER_COLOR_MODE_DEFAULT	0
+#define GEN6_BORDER_COLOR_MODE_LEGACY	1
+
+#define GEN6_TEXCOORDMODE_WRAP            0
+#define GEN6_TEXCOORDMODE_MIRROR          1
+#define GEN6_TEXCOORDMODE_CLAMP           2
+#define GEN6_TEXCOORDMODE_CUBE            3
+#define GEN6_TEXCOORDMODE_CLAMP_BORDER    4
+#define GEN6_TEXCOORDMODE_MIRROR_ONCE     5
+
+#define GEN6_THREAD_PRIORITY_NORMAL   0
+#define GEN6_THREAD_PRIORITY_HIGH     1
+
+#define GEN6_TILEWALK_XMAJOR                 0
+#define GEN6_TILEWALK_YMAJOR                 1
+
+#define GEN6_VERTEX_SUBPIXEL_PRECISION_8BITS  0
+#define GEN6_VERTEX_SUBPIXEL_PRECISION_4BITS  1
+
+#define GEN6_VERTEXBUFFER_ACCESS_VERTEXDATA     0
+#define GEN6_VERTEXBUFFER_ACCESS_INSTANCEDATA   1
+
+#define GEN6_VFCOMPONENT_NOSTORE      0
+#define GEN6_VFCOMPONENT_STORE_SRC    1
+#define GEN6_VFCOMPONENT_STORE_0      2
+#define GEN6_VFCOMPONENT_STORE_1_FLT  3
+#define GEN6_VFCOMPONENT_STORE_1_INT  4
+#define GEN6_VFCOMPONENT_STORE_VID    5
+#define GEN6_VFCOMPONENT_STORE_IID    6
+#define GEN6_VFCOMPONENT_STORE_PID    7
+
+
+
+/* Execution Unit (EU) defines
+ */
+
+#define GEN6_ALIGN_1   0
+#define GEN6_ALIGN_16  1
+
+#define GEN6_ADDRESS_DIRECT                        0
+#define GEN6_ADDRESS_REGISTER_INDIRECT_REGISTER    1
+
+#define GEN6_CHANNEL_X     0
+#define GEN6_CHANNEL_Y     1
+#define GEN6_CHANNEL_Z     2
+#define GEN6_CHANNEL_W     3
+
+#define GEN6_COMPRESSION_NONE          0
+#define GEN6_COMPRESSION_2NDHALF       1
+#define GEN6_COMPRESSION_COMPRESSED    2
+
+#define GEN6_CONDITIONAL_NONE  0
+#define GEN6_CONDITIONAL_Z     1
+#define GEN6_CONDITIONAL_NZ    2
+#define GEN6_CONDITIONAL_EQ    1	/* Z */
+#define GEN6_CONDITIONAL_NEQ   2	/* NZ */
+#define GEN6_CONDITIONAL_G     3
+#define GEN6_CONDITIONAL_GE    4
+#define GEN6_CONDITIONAL_L     5
+#define GEN6_CONDITIONAL_LE    6
+#define GEN6_CONDITIONAL_C     7
+#define GEN6_CONDITIONAL_O     8
+
+#define GEN6_DEBUG_NONE        0
+#define GEN6_DEBUG_BREAKPOINT  1
+
+#define GEN6_DEPENDENCY_NORMAL         0
+#define GEN6_DEPENDENCY_NOTCLEARED     1
+#define GEN6_DEPENDENCY_NOTCHECKED     2
+#define GEN6_DEPENDENCY_DISABLE        3
+
+#define GEN6_EXECUTE_1     0
+#define GEN6_EXECUTE_2     1
+#define GEN6_EXECUTE_4     2
+#define GEN6_EXECUTE_8     3
+#define GEN6_EXECUTE_16    4
+#define GEN6_EXECUTE_32    5
+
+#define GEN6_HORIZONTAL_STRIDE_0   0
+#define GEN6_HORIZONTAL_STRIDE_1   1
+#define GEN6_HORIZONTAL_STRIDE_2   2
+#define GEN6_HORIZONTAL_STRIDE_4   3
+
+#define GEN6_INSTRUCTION_NORMAL    0
+#define GEN6_INSTRUCTION_SATURATE  1
+
+#define GEN6_MASK_ENABLE   0
+#define GEN6_MASK_DISABLE  1
+
+#define GEN6_OPCODE_MOV        1
+#define GEN6_OPCODE_SEL        2
+#define GEN6_OPCODE_NOT        4
+#define GEN6_OPCODE_AND        5
+#define GEN6_OPCODE_OR         6
+#define GEN6_OPCODE_XOR        7
+#define GEN6_OPCODE_SHR        8
+#define GEN6_OPCODE_SHL        9
+#define GEN6_OPCODE_RSR        10
+#define GEN6_OPCODE_RSL        11
+#define GEN6_OPCODE_ASR        12
+#define GEN6_OPCODE_CMP        16
+#define GEN6_OPCODE_JMPI       32
+#define GEN6_OPCODE_IF         34
+#define GEN6_OPCODE_IFF        35
+#define GEN6_OPCODE_ELSE       36
+#define GEN6_OPCODE_ENDIF      37
+#define GEN6_OPCODE_DO         38
+#define GEN6_OPCODE_WHILE      39
+#define GEN6_OPCODE_BREAK      40
+#define GEN6_OPCODE_CONTINUE   41
+#define GEN6_OPCODE_HALT       42
+#define GEN6_OPCODE_MSAVE      44
+#define GEN6_OPCODE_MRESTORE   45
+#define GEN6_OPCODE_PUSH       46
+#define GEN6_OPCODE_POP        47
+#define GEN6_OPCODE_WAIT       48
+#define GEN6_OPCODE_SEND       49
+#define GEN6_OPCODE_ADD        64
+#define GEN6_OPCODE_MUL        65
+#define GEN6_OPCODE_AVG        66
+#define GEN6_OPCODE_FRC        67
+#define GEN6_OPCODE_RNDU       68
+#define GEN6_OPCODE_RNDD       69
+#define GEN6_OPCODE_RNDE       70
+#define GEN6_OPCODE_RNDZ       71
+#define GEN6_OPCODE_MAC        72
+#define GEN6_OPCODE_MACH       73
+#define GEN6_OPCODE_LZD        74
+#define GEN6_OPCODE_SAD2       80
+#define GEN6_OPCODE_SADA2      81
+#define GEN6_OPCODE_DP4        84
+#define GEN6_OPCODE_DPH        85
+#define GEN6_OPCODE_DP3        86
+#define GEN6_OPCODE_DP2        87
+#define GEN6_OPCODE_DPA2       88
+#define GEN6_OPCODE_LINE       89
+#define GEN6_OPCODE_NOP        126
+
+#define GEN6_PREDICATE_NONE             0	/* 0 and 1 are not tied to an ALIGN1/ALIGN16 name */
+#define GEN6_PREDICATE_NORMAL           1
+#define GEN6_PREDICATE_ALIGN1_ANYV             2	/* ALIGN1 names: values 2-11 */
+#define GEN6_PREDICATE_ALIGN1_ALLV             3
+#define GEN6_PREDICATE_ALIGN1_ANY2H            4
+#define GEN6_PREDICATE_ALIGN1_ALL2H            5
+#define GEN6_PREDICATE_ALIGN1_ANY4H            6
+#define GEN6_PREDICATE_ALIGN1_ALL4H            7
+#define GEN6_PREDICATE_ALIGN1_ANY8H            8
+#define GEN6_PREDICATE_ALIGN1_ALL8H            9
+#define GEN6_PREDICATE_ALIGN1_ANY16H           10
+#define GEN6_PREDICATE_ALIGN1_ALL16H           11
+#define GEN6_PREDICATE_ALIGN16_REPLICATE_X     2	/* ALIGN16 names reuse values 2-7 of the ALIGN1 names; presumably picked by GEN6_ALIGN_1/GEN6_ALIGN_16 - TODO confirm */
+#define GEN6_PREDICATE_ALIGN16_REPLICATE_Y     3
+#define GEN6_PREDICATE_ALIGN16_REPLICATE_Z     4
+#define GEN6_PREDICATE_ALIGN16_REPLICATE_W     5
+#define GEN6_PREDICATE_ALIGN16_ANY4H           6
+#define GEN6_PREDICATE_ALIGN16_ALL4H           7
+
+#define GEN6_ARCHITECTURE_REGISTER_FILE    0
+#define GEN6_GENERAL_REGISTER_FILE         1
+#define GEN6_MESSAGE_REGISTER_FILE         2
+#define GEN6_IMMEDIATE_VALUE               3
+
+#define GEN6_REGISTER_TYPE_UD  0
+#define GEN6_REGISTER_TYPE_D   1
+#define GEN6_REGISTER_TYPE_UW  2
+#define GEN6_REGISTER_TYPE_W   3
+#define GEN6_REGISTER_TYPE_UB  4
+#define GEN6_REGISTER_TYPE_B   5
+#define GEN6_REGISTER_TYPE_VF  5	/* packed float vector, immediates only? */
+#define GEN6_REGISTER_TYPE_HF  6
+#define GEN6_REGISTER_TYPE_V   6	/* packed int vector, immediates only, uword dest only */
+#define GEN6_REGISTER_TYPE_F   7
+
+#define GEN6_ARF_NULL                  0x00
+#define GEN6_ARF_ADDRESS               0x10
+#define GEN6_ARF_ACCUMULATOR           0x20   
+#define GEN6_ARF_FLAG                  0x30
+#define GEN6_ARF_MASK                  0x40
+#define GEN6_ARF_MASK_STACK            0x50
+#define GEN6_ARF_MASK_STACK_DEPTH      0x60
+#define GEN6_ARF_STATE                 0x70
+#define GEN6_ARF_CONTROL               0x80
+#define GEN6_ARF_NOTIFICATION_COUNT    0x90
+#define GEN6_ARF_IP                    0xA0
+
+#define GEN6_AMASK   0
+#define GEN6_IMASK   1
+#define GEN6_LMASK   2
+#define GEN6_CMASK   3
+
+
+
+#define GEN6_THREAD_NORMAL     0
+#define GEN6_THREAD_ATOMIC     1
+#define GEN6_THREAD_SWITCH     2
+
+#define GEN6_VERTICAL_STRIDE_0                 0
+#define GEN6_VERTICAL_STRIDE_1                 1
+#define GEN6_VERTICAL_STRIDE_2                 2
+#define GEN6_VERTICAL_STRIDE_4                 3
+#define GEN6_VERTICAL_STRIDE_8                 4
+#define GEN6_VERTICAL_STRIDE_16                5
+#define GEN6_VERTICAL_STRIDE_32                6
+#define GEN6_VERTICAL_STRIDE_64                7
+#define GEN6_VERTICAL_STRIDE_128               8
+#define GEN6_VERTICAL_STRIDE_256               9
+#define GEN6_VERTICAL_STRIDE_ONE_DIMENSIONAL   0xF
+
+#define GEN6_WIDTH_1       0
+#define GEN6_WIDTH_2       1
+#define GEN6_WIDTH_4       2
+#define GEN6_WIDTH_8       3
+#define GEN6_WIDTH_16      4
+
+#define GEN6_STATELESS_BUFFER_BOUNDARY_1K      0
+#define GEN6_STATELESS_BUFFER_BOUNDARY_2K      1
+#define GEN6_STATELESS_BUFFER_BOUNDARY_4K      2
+#define GEN6_STATELESS_BUFFER_BOUNDARY_8K      3
+#define GEN6_STATELESS_BUFFER_BOUNDARY_16K     4
+#define GEN6_STATELESS_BUFFER_BOUNDARY_32K     5
+#define GEN6_STATELESS_BUFFER_BOUNDARY_64K     6
+#define GEN6_STATELESS_BUFFER_BOUNDARY_128K    7
+#define GEN6_STATELESS_BUFFER_BOUNDARY_256K    8
+#define GEN6_STATELESS_BUFFER_BOUNDARY_512K    9
+#define GEN6_STATELESS_BUFFER_BOUNDARY_1M      10
+#define GEN6_STATELESS_BUFFER_BOUNDARY_2M      11
+
+#define GEN6_POLYGON_FACING_FRONT      0	/* same value as GEN6_POLYGON_FRONT_FACING defined earlier in this header */
+#define GEN6_POLYGON_FACING_BACK       1	/* same value as GEN6_POLYGON_BACK_FACING defined earlier in this header */
+
+#define GEN6_MESSAGE_TARGET_NULL               0
+#define GEN6_MESSAGE_TARGET_MATH               1
+#define GEN6_MESSAGE_TARGET_SAMPLER            2
+#define GEN6_MESSAGE_TARGET_GATEWAY            3
+#define GEN6_MESSAGE_TARGET_DATAPORT_READ      4
+#define GEN6_MESSAGE_TARGET_DATAPORT_WRITE     5
+#define GEN6_MESSAGE_TARGET_URB                6
+#define GEN6_MESSAGE_TARGET_THREAD_SPAWNER     7
+
+#define GEN6_SAMPLER_RETURN_FORMAT_FLOAT32     0
+#define GEN6_SAMPLER_RETURN_FORMAT_UINT32      2
+#define GEN6_SAMPLER_RETURN_FORMAT_SINT32      3
+
+#define GEN6_SAMPLER_MESSAGE_SIMD8_SAMPLE              0	/* only values 0-3 occur in this list and they repeat across names, so a code is not unique on its own */
+#define GEN6_SAMPLER_MESSAGE_SIMD16_SAMPLE             0
+#define GEN6_SAMPLER_MESSAGE_SIMD16_SAMPLE_BIAS        0
+#define GEN6_SAMPLER_MESSAGE_SIMD8_KILLPIX             1
+#define GEN6_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_LOD        1
+#define GEN6_SAMPLER_MESSAGE_SIMD16_SAMPLE_LOD         1
+#define GEN6_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_GRADIENTS  2
+#define GEN6_SAMPLER_MESSAGE_SIMD8_SAMPLE_GRADIENTS    2
+#define GEN6_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_COMPARE    0	/* out of numeric order: back to 0 */
+#define GEN6_SAMPLER_MESSAGE_SIMD16_SAMPLE_COMPARE     2
+#define GEN6_SAMPLER_MESSAGE_SIMD4X2_RESINFO           2
+#define GEN6_SAMPLER_MESSAGE_SIMD8_RESINFO             2
+#define GEN6_SAMPLER_MESSAGE_SIMD16_RESINFO            2
+#define GEN6_SAMPLER_MESSAGE_SIMD4X2_LD                3
+#define GEN6_SAMPLER_MESSAGE_SIMD8_LD                  3
+#define GEN6_SAMPLER_MESSAGE_SIMD16_LD                 3
+
+#define GEN6_DATAPORT_OWORD_BLOCK_1_OWORDLOW   0
+#define GEN6_DATAPORT_OWORD_BLOCK_1_OWORDHIGH  1
+#define GEN6_DATAPORT_OWORD_BLOCK_2_OWORDS     2
+#define GEN6_DATAPORT_OWORD_BLOCK_4_OWORDS     3
+#define GEN6_DATAPORT_OWORD_BLOCK_8_OWORDS     4
+
+#define GEN6_DATAPORT_OWORD_DUAL_BLOCK_1OWORD     0
+#define GEN6_DATAPORT_OWORD_DUAL_BLOCK_4OWORDS    2
+
+#define GEN6_DATAPORT_DWORD_SCATTERED_BLOCK_8DWORDS   2
+#define GEN6_DATAPORT_DWORD_SCATTERED_BLOCK_16DWORDS  3
+
+#define GEN6_DATAPORT_READ_MESSAGE_OWORD_BLOCK_READ          0
+#define GEN6_DATAPORT_READ_MESSAGE_OWORD_DUAL_BLOCK_READ     1
+#define GEN6_DATAPORT_READ_MESSAGE_DWORD_BLOCK_READ          2
+#define GEN6_DATAPORT_READ_MESSAGE_DWORD_SCATTERED_READ      3
+
+#define GEN6_DATAPORT_READ_TARGET_DATA_CACHE      0
+#define GEN6_DATAPORT_READ_TARGET_RENDER_CACHE    1
+#define GEN6_DATAPORT_READ_TARGET_SAMPLER_CACHE   2
+
+#define GEN6_DATAPORT_RENDER_TARGET_WRITE_SIMD16_SINGLE_SOURCE                0
+#define GEN6_DATAPORT_RENDER_TARGET_WRITE_SIMD16_SINGLE_SOURCE_REPLICATED     1
+#define GEN6_DATAPORT_RENDER_TARGET_WRITE_SIMD8_DUAL_SOURCE_SUBSPAN01         2
+#define GEN6_DATAPORT_RENDER_TARGET_WRITE_SIMD8_DUAL_SOURCE_SUBSPAN23         3
+#define GEN6_DATAPORT_RENDER_TARGET_WRITE_SIMD8_SINGLE_SOURCE_SUBSPAN01       4
+
+#define GEN6_DATAPORT_WRITE_MESSAGE_OWORD_BLOCK_WRITE                0
+#define GEN6_DATAPORT_WRITE_MESSAGE_OWORD_DUAL_BLOCK_WRITE           1
+#define GEN6_DATAPORT_WRITE_MESSAGE_DWORD_BLOCK_WRITE                2
+#define GEN6_DATAPORT_WRITE_MESSAGE_DWORD_SCATTERED_WRITE            3
+#define GEN6_DATAPORT_WRITE_MESSAGE_RENDER_TARGET_WRITE              4
+#define GEN6_DATAPORT_WRITE_MESSAGE_STREAMED_VERTEX_BUFFER_WRITE     5
+#define GEN6_DATAPORT_WRITE_MESSAGE_FLUSH_RENDER_CACHE               7
+
+#define GEN6_MATH_FUNCTION_INV                              1
+#define GEN6_MATH_FUNCTION_LOG                              2
+#define GEN6_MATH_FUNCTION_EXP                              3
+#define GEN6_MATH_FUNCTION_SQRT                             4
+#define GEN6_MATH_FUNCTION_RSQ                              5
+#define GEN6_MATH_FUNCTION_SIN                              6 /* was 7 */
+#define GEN6_MATH_FUNCTION_COS                              7 /* was 8 */
+#define GEN6_MATH_FUNCTION_SINCOS                           8 /* was 6 */
+#define GEN6_MATH_FUNCTION_TAN                              9
+#define GEN6_MATH_FUNCTION_POW                              10
+#define GEN6_MATH_FUNCTION_INT_DIV_QUOTIENT_AND_REMAINDER   11
+#define GEN6_MATH_FUNCTION_INT_DIV_QUOTIENT                 12
+#define GEN6_MATH_FUNCTION_INT_DIV_REMAINDER                13
+
+#define GEN6_MATH_INTEGER_UNSIGNED     0
+#define GEN6_MATH_INTEGER_SIGNED       1
+
+#define GEN6_MATH_PRECISION_FULL        0
+#define GEN6_MATH_PRECISION_PARTIAL     1
+
+#define GEN6_MATH_SATURATE_NONE         0
+#define GEN6_MATH_SATURATE_SATURATE     1
+
+#define GEN6_MATH_DATA_VECTOR  0
+#define GEN6_MATH_DATA_SCALAR  1
+
+#define GEN6_URB_OPCODE_WRITE  0
+
+#define GEN6_URB_SWIZZLE_NONE          0
+#define GEN6_URB_SWIZZLE_INTERLEAVE    1
+#define GEN6_URB_SWIZZLE_TRANSPOSE     2
+
+#define GEN6_SCRATCH_SPACE_SIZE_1K     0
+#define GEN6_SCRATCH_SPACE_SIZE_2K     1
+#define GEN6_SCRATCH_SPACE_SIZE_4K     2
+#define GEN6_SCRATCH_SPACE_SIZE_8K     3
+#define GEN6_SCRATCH_SPACE_SIZE_16K    4
+#define GEN6_SCRATCH_SPACE_SIZE_32K    5
+#define GEN6_SCRATCH_SPACE_SIZE_64K    6
+#define GEN6_SCRATCH_SPACE_SIZE_128K   7
+#define GEN6_SCRATCH_SPACE_SIZE_256K   8
+#define GEN6_SCRATCH_SPACE_SIZE_512K   9
+#define GEN6_SCRATCH_SPACE_SIZE_1M     10
+#define GEN6_SCRATCH_SPACE_SIZE_2M     11
+
+/* The hardware supports two different modes for border color. The
+ * default (OpenGL) mode uses floating-point color channels, while the
+ * legacy mode uses 4 bytes.
+ *
+ * More significantly, the legacy mode respects the components of the
+ * border color for channels not present in the source, (whereas the
+ * default mode will ignore the border color's alpha channel and use
+ * alpha==1 for an RGB source, for example).
+ *
+ * The legacy mode matches the semantics specified by the Render
+ * extension.
+ */
+struct gen6_sampler_default_border_color {	/* border color for the default (floating-point) mode */
+   float color[4];	/* four float channels; channel order is not stated here - TODO confirm */
+};
+
+struct gen6_sampler_legacy_border_color {	/* border color for the legacy (4-byte) mode */
+   uint8_t color[4];	/* four single-byte channels; channel order is not stated here - TODO confirm */
+};
+
+struct gen6_sampler_state {	/* sampler state as four groups ss0..ss3 of 32 bits each; field order is the layout, do not reorder */
+   struct {	/* ss0: widths 3+11+3+3+2+5+1+1+1+1+1 = 32 */
+      uint32_t shadow_function:3;
+      uint32_t lod_bias:11;
+      uint32_t min_filter:3;	/* presumably a GEN6_MAPFILTER_* value - TODO confirm */
+      uint32_t mag_filter:3;	/* presumably a GEN6_MAPFILTER_* value - TODO confirm */
+      uint32_t mip_filter:2;	/* presumably a GEN6_MIPFILTER_* value - TODO confirm */
+      uint32_t base_level:5;
+      uint32_t pad:1;
+      uint32_t lod_preclamp:1;
+      uint32_t border_color_mode:1;	/* presumably GEN6_BORDER_COLOR_MODE_DEFAULT/LEGACY - TODO confirm */
+      uint32_t pad0:1;
+      uint32_t disable:1;
+   } ss0;
+
+   struct {	/* ss1: widths 3+3+3+3+10+10 = 32 */
+      uint32_t r_wrap_mode:3;	/* presumably a GEN6_TEXCOORDMODE_* value - TODO confirm */
+      uint32_t t_wrap_mode:3;	/* presumably a GEN6_TEXCOORDMODE_* value - TODO confirm */
+      uint32_t s_wrap_mode:3;	/* presumably a GEN6_TEXCOORDMODE_* value - TODO confirm */
+      uint32_t pad:3;
+      uint32_t max_lod:10;
+      uint32_t min_lod:10;
+   } ss1;
+
+   struct {	/* ss2: a single full-width 32-bit field */
+      uint32_t border_color;	/* encoding not shown in this header - TODO confirm against the code that fills it */
+   } ss2;
+
+   struct {	/* ss3: widths 19+3+1+2+1+3+3 = 32 */
+      uint32_t pad:19;
+      uint32_t max_aniso:3;	/* presumably a GEN6_ANISORATIO_* value (0-7 fits in 3 bits) - TODO confirm */
+      uint32_t chroma_key_mode:1;	/* presumably a GEN6_CHROMAKEY_* value - TODO confirm */
+      uint32_t chroma_key_index:2;
+      uint32_t chroma_key_enable:1;
+      uint32_t monochrome_filter_width:3;
+      uint32_t monochrome_filter_height:3;
+   } ss3;
+};
+
+struct gen6_blend_state { /* bit-fields in blend0 and blend1 each add up to 32 bits */
+	struct {
+		uint32_t dest_blend_factor:5; /* GEN6_BLENDFACTOR_* value */
+		uint32_t source_blend_factor:5; /* GEN6_BLENDFACTOR_* value */
+		uint32_t pad3:1;
+		uint32_t blend_func:3; /* e.g. GEN6_BLENDFUNCTION_ADD */
+		uint32_t pad2:1;
+		uint32_t ia_dest_blend_factor:5; /* ia_*: presumably "independent alpha" -- TODO confirm */
+		uint32_t ia_source_blend_factor:5;
+		uint32_t pad1:1;
+		uint32_t ia_blend_func:3;
+		uint32_t pad0:1;
+		uint32_t ia_blend_enable:1;
+		uint32_t blend_enable:1;
+	} blend0;
+
+	struct {
+		uint32_t post_blend_clamp_enable:1;
+		uint32_t pre_blend_clamp_enable:1;
+		uint32_t clamp_range:2;
+		uint32_t pad0:4;
+		uint32_t x_dither_offset:2;
+		uint32_t y_dither_offset:2;
+		uint32_t dither_enable:1;
+		uint32_t alpha_test_func:3;
+		uint32_t alpha_test_enable:1;
+		uint32_t pad1:1;
+		uint32_t logic_op_func:4;
+		uint32_t logic_op_enable:1;
+		uint32_t pad2:1;
+		uint32_t write_disable_b:1; /* one write-disable bit per channel: b, g, r, a */
+		uint32_t write_disable_g:1;
+		uint32_t write_disable_r:1;
+		uint32_t write_disable_a:1;
+		uint32_t pad3:1;
+		uint32_t alpha_to_coverage_dither:1;
+		uint32_t alpha_to_one:1;
+		uint32_t alpha_to_coverage:1;
+	} blend1;
+};
+
+struct gen6_color_calc_state { /* cc0 bit-fields, the cc1 union, then four float constants */
+	struct {
+		uint32_t alpha_test_format:1; /* NOTE(review): likely selects which cc1 member is meaningful -- confirm */
+		uint32_t pad0:14;
+		uint32_t round_disable:1;
+		uint32_t bf_stencil_ref:8; /* bf_: presumably back-face -- TODO confirm */
+		uint32_t stencil_ref:8;
+	} cc0;
+
+	union { /* two views of the alpha reference: a float, or an 8-bit field plus padding */
+		float alpha_ref_f;
+		struct {
+			uint32_t ui:8;
+			uint32_t pad0:24;
+		} alpha_ref_fi;
+	} cc1;
+
+	float constant_r; /* one float constant per channel: r, g, b, a */
+	float constant_g;
+	float constant_b;
+	float constant_a;
+};
+
+struct gen6_depth_stencil_state { /* bit-fields in ds0, ds1 and ds2 each add up to 32 bits */
+	struct {
+		uint32_t pad0:3;
+		uint32_t bf_stencil_pass_depth_pass_op:3; /* bf_* fields mirror the unprefixed stencil fields below; presumably back-face -- TODO confirm */
+		uint32_t bf_stencil_pass_depth_fail_op:3;
+		uint32_t bf_stencil_fail_op:3;
+		uint32_t bf_stencil_func:3;
+		uint32_t bf_stencil_enable:1;
+		uint32_t pad1:2;
+		uint32_t stencil_write_enable:1;
+		uint32_t stencil_pass_depth_pass_op:3;
+		uint32_t stencil_pass_depth_fail_op:3;
+		uint32_t stencil_fail_op:3;
+		uint32_t stencil_func:3;
+		uint32_t stencil_enable:1;
+	} ds0;
+
+	struct { /* four 8-bit masks */
+		uint32_t bf_stencil_write_mask:8;
+		uint32_t bf_stencil_test_mask:8;
+		uint32_t stencil_write_mask:8;
+		uint32_t stencil_test_mask:8;
+	} ds1;
+
+	struct { /* depth controls; most of the word is padding */
+		uint32_t pad0:26;
+		uint32_t depth_write_enable:1;
+		uint32_t depth_test_func:3;
+		uint32_t pad1:1;
+		uint32_t depth_test_enable:1;
+	} ds2;
+};
+
+struct gen6_surface_state { /* six words ss0..ss5; every bit-field group adds up to 32 bits */
+	struct {
+		uint32_t cube_pos_z:1;
+		uint32_t cube_neg_z:1;
+		uint32_t cube_pos_y:1;
+		uint32_t cube_neg_y:1;
+		uint32_t cube_pos_x:1;
+		uint32_t cube_neg_x:1;
+		uint32_t pad:3;
+		uint32_t render_cache_read_mode:1;
+		uint32_t mipmap_layout_mode:1;
+		uint32_t vert_line_stride_ofs:1;
+		uint32_t vert_line_stride:1;
+		uint32_t color_blend:1; /* the gem_stress surface setup stores 1 here */
+		uint32_t writedisable_blue:1;
+		uint32_t writedisable_green:1;
+		uint32_t writedisable_red:1;
+		uint32_t writedisable_alpha:1;
+		uint32_t surface_format:9; /* GEN6_SURFACEFORMAT_* value */
+		uint32_t data_return_format:1; /* e.g. GEN6_SURFACERETURNFORMAT_FLOAT32 */
+		uint32_t pad0:1;
+		uint32_t surface_type:3; /* e.g. GEN6_SURFACE_2D */
+	} ss0;
+
+	struct {
+		uint32_t base_addr; /* gem_stress writes the buffer object offset here and emits a relocation at byte offset 4 of this state */
+	} ss1;
+
+	struct {
+		uint32_t render_target_rotation:2;
+		uint32_t mip_count:4;
+		uint32_t width:13; /* gem_stress stores the width minus 1 */
+		uint32_t height:13; /* gem_stress stores the height minus 1 */
+	} ss2;
+
+	struct {
+		uint32_t tile_walk:1; /* gem_stress stores 1 only for I915_TILING_Y */
+		uint32_t tiled_surface:1; /* gem_stress stores 1 for any tiling other than I915_TILING_NONE */
+		uint32_t pad:1;
+		uint32_t pitch:18; /* gem_stress stores the buffer stride minus 1 */
+		uint32_t depth:11;
+	} ss3;
+
+	struct {
+		uint32_t pad:19;
+		uint32_t min_array_elt:9;
+		uint32_t min_lod:4;
+	} ss4;
+
+	struct {
+		uint32_t pad:20;
+		uint32_t y_offset:4;
+		uint32_t pad2:1;
+		uint32_t x_offset:7;
+	} ss5;
+};
+
+struct gen6_cc_viewport { /* a pair of float depth limits */
+	float min_depth; /* the gem_stress viewport setup stores -1.e35 here */
+	float max_depth; /* the gem_stress viewport setup stores 1.e35 here */
+};
+
+typedef enum { /* filter selector consumed by the gem_stress gen6 sampler setup */
+	SAMPLER_FILTER_NEAREST = 0, /* min and mag filters become GEN6_MAPFILTER_NEAREST; also the fallback for unknown values */
+	SAMPLER_FILTER_BILINEAR, /* min and mag filters become GEN6_MAPFILTER_LINEAR */
+	FILTER_COUNT /* last enumerator, so it equals the number of filters listed above */
+} sampler_filter_t;
+
+typedef enum { /* wrap selector; the gem_stress gen6 sampler setup applies one mode to r, s and t alike */
+	SAMPLER_EXTEND_NONE = 0, /* GEN6_TEXCOORDMODE_CLAMP_BORDER; also the fallback for unknown values */
+	SAMPLER_EXTEND_REPEAT, /* GEN6_TEXCOORDMODE_WRAP */
+	SAMPLER_EXTEND_PAD, /* GEN6_TEXCOORDMODE_CLAMP */
+	SAMPLER_EXTEND_REFLECT, /* GEN6_TEXCOORDMODE_MIRROR */
+	EXTEND_COUNT /* last enumerator, so it equals the number of modes listed above */
+} sampler_extend_t;
+
+#endif
diff --git a/lib/intel_gpu_tools.h b/lib/intel_gpu_tools.h
index f2134bf..cd964bd 100644
--- a/lib/intel_gpu_tools.h
+++ b/lib/intel_gpu_tools.h
@@ -25,6 +25,9 @@
  *
  */
 
+#ifndef _IGT_H_
+#define _IGT_H_
+
 #include <stdint.h>
 #include <sys/types.h>
 #include <pciaccess.h>
@@ -93,3 +96,5 @@ extern enum pch_type pch;
 void intel_check_pch(void);
 
 #define HAS_CPT (pch == PCH_CPT)
+
+#endif /* _IGT_H_ */
diff --git a/tests/Makefile.am b/tests/Makefile.am
index 190d2d3..6fdc96f 100644
--- a/tests/Makefile.am
+++ b/tests/Makefile.am
@@ -6,11 +6,6 @@ noinst_PROGRAMS = \
 
 gem_stress_SOURCES = \
 	gem_stress.c \
-	gem_stress.h \
-	gem_stress_i915.c \
-	gem_stress_i830.c \
-	gen6_render.h \
-	gem_stress_gen6.c \
 	$(NULL)
 
 TESTS_progs = \
diff --git a/tests/gem_stress.c b/tests/gem_stress.c
index 7f93964..8338705 100644
--- a/tests/gem_stress.c
+++ b/tests/gem_stress.c
@@ -297,22 +297,31 @@ static void render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned sr
 			    struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
 			    unsigned logical_tile_no)
 {
-	if (IS_GEN2(devid))
+
+	if (IS_GEN2(devid)) {
 		gen2_render_copyfunc(src, src_x, src_y,
 				     dst, dst_x, dst_y,
 				     logical_tile_no);
-	else if (IS_GEN3(devid))
+		intel_batchbuffer_flush(batch);
+	} else if (IS_GEN3(devid)) {
 		gen3_render_copyfunc(src, src_x, src_y,
 				     dst, dst_x, dst_y,
 				     logical_tile_no);
-	else if (IS_GEN6(devid))
-		gen6_render_copyfunc(src, src_x, src_y,
-				     dst, dst_x, dst_y,
-				     logical_tile_no);
-	else
+		intel_batchbuffer_flush(batch);
+	} else if (IS_GEN6(devid)) {
+		uint32_t ret;
+		intel_batchbuffer_flush(batch);
+		ret = gen6_render_copyfunc(src, src_x, src_y,
+					   dst, dst_x, dst_y,
+					   logical_tile_no);
+		gen6_render_flush(ret);
+		intel_batchbuffer_reset(batch);
+	} else {
 		blitter_copyfunc(src, src_x, src_y,
 				 dst, dst_x, dst_y,
 				 logical_tile_no);
+	}
+
 }
 
 static void next_copyfunc(int tile)
diff --git a/tests/gem_stress.h b/tests/gem_stress.h
deleted file mode 100644
index f44773d..0000000
--- a/tests/gem_stress.h
+++ /dev/null
@@ -1,100 +0,0 @@
-#include <stdlib.h>
-#include <sys/ioctl.h>
-#include <stdio.h>
-#include <string.h>
-#include <assert.h>
-#include <fcntl.h>
-#include <inttypes.h>
-#include <errno.h>
-#include <sys/stat.h>
-#include <sys/time.h>
-#include <getopt.h>
-#include "drm.h"
-#include "i915_drm.h"
-#include "drmtest.h"
-#include "intel_bufmgr.h"
-#include "intel_batchbuffer.h"
-#include "intel_gpu_tools.h"
-
-struct scratch_buf {
-    drm_intel_bo *bo;
-    uint32_t stride;
-    uint32_t tiling;
-    uint32_t *data;
-    uint32_t *cpu_mapping;
-    unsigned num_tiles;
-};
-
-struct option_struct {
-    unsigned scratch_buf_size;
-    unsigned max_dimension;
-    unsigned num_buffers;
-    int trace_tile;
-    int no_hw;
-    int gpu_busy_load;
-    int use_render;
-    int use_blt;
-    int forced_tiling;
-    int use_cpu_maps;
-    int total_rounds;
-    int fail;
-    int tiles_per_buf;
-    int ducttape;
-    int tile_size;
-    int check_render_cpyfn;
-    int use_signal_helper;
-};
-
-extern struct option_struct options;
-extern drm_intel_bufmgr *bufmgr;
-extern struct intel_batchbuffer *batch;
-extern int drm_fd;
-extern int devid;
-
-extern int fence_storm;
-
-#define MAX_BUFS		4096
-#define SCRATCH_BUF_SIZE	1024*1024
-#define BUSY_BUF_SIZE		(256*4096)
-#define TILE_BYTES(size)	((size)*(size)*sizeof(uint32_t))
-
-void keep_gpu_busy(void);
-
-static inline void emit_vertex_2s(int16_t x, int16_t y)
-{
-	OUT_BATCH((uint16_t)y << 16 | (uint16_t)x);
-}
-
-static inline void emit_vertex(float f)
-{
-	union { float f; uint32_t ui; } u;
-	u.f = f;
-	OUT_BATCH(u.ui);
-}
-
-static inline void emit_vertex_normalized(float f, float total)
-{
-	union { float f; uint32_t ui; } u;
-	u.f = f / total;
-	OUT_BATCH(u.ui);
-}
-
-static inline unsigned buf_width(struct scratch_buf *buf)
-{
-	return buf->stride/sizeof(uint32_t);
-}
-
-static inline unsigned buf_height(struct scratch_buf *buf)
-{
-	return options.scratch_buf_size/buf->stride;
-}
-
-void gen6_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
-			  struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
-			  unsigned logical_tile_no);
-void gen3_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
-			  struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
-			  unsigned logical_tile_no);
-void gen2_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
-			  struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
-			  unsigned logical_tile_no);
diff --git a/tests/gem_stress_gen6.c b/tests/gem_stress_gen6.c
deleted file mode 100644
index 735c489..0000000
--- a/tests/gem_stress_gen6.c
+++ /dev/null
@@ -1,595 +0,0 @@
-#include "gem_stress.h"
-#include "gen6_render.h"
-
-#include <assert.h>
-
-#define ALIGN(x, y) (((x) + (y)-1) & ~((y)-1))
-#define VERTEX_SIZE (3*4)
-
-static const uint32_t ps_kernel_nomask_affine[][4] = {
-	{ 0x0060005a, 0x204077be, 0x000000c0, 0x008d0040 },
-	{ 0x0060005a, 0x206077be, 0x000000c0, 0x008d0080 },
-	{ 0x0060005a, 0x208077be, 0x000000d0, 0x008d0040 },
-	{ 0x0060005a, 0x20a077be, 0x000000d0, 0x008d0080 },
-	{ 0x00000201, 0x20080061, 0x00000000, 0x00000000 },
-	{ 0x00600001, 0x20200022, 0x008d0000, 0x00000000 },
-	{ 0x02800031, 0x21c01cc9, 0x00000020, 0x0a8a0001 },
-	{ 0x00600001, 0x204003be, 0x008d01c0, 0x00000000 },
-	{ 0x00600001, 0x206003be, 0x008d01e0, 0x00000000 },
-	{ 0x00600001, 0x208003be, 0x008d0200, 0x00000000 },
-	{ 0x00600001, 0x20a003be, 0x008d0220, 0x00000000 },
-	{ 0x00600001, 0x20c003be, 0x008d0240, 0x00000000 },
-	{ 0x00600001, 0x20e003be, 0x008d0260, 0x00000000 },
-	{ 0x00600001, 0x210003be, 0x008d0280, 0x00000000 },
-	{ 0x00600001, 0x212003be, 0x008d02a0, 0x00000000 },
-	{ 0x05800031, 0x24001cc8, 0x00000040, 0x90019000 },
-	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
-	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
-	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
-	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
-	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
-	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
-	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
-	{ 0x0000007e, 0x00000000, 0x00000000, 0x00000000 },
-};
-
-static uint32_t
-batch_used(void)
-{
-	return batch->ptr - batch->buffer;
-}
-
-static uint32_t
-batch_align(uint32_t align)
-{
-	uint32_t offset = batch_used();
-	offset = ALIGN(offset, align);
-	batch->ptr = batch->buffer + offset;
-	return offset;
-}
-
-static uint32_t
-batch_round_upto(uint32_t divisor)
-{
-	uint32_t offset = batch_used();
-	offset = (offset + divisor-1) / divisor * divisor;
-	batch->ptr = batch->buffer + offset;
-	return offset;
-}
-
-static void *
-batch_alloc(uint32_t size, uint32_t align)
-{
-	uint32_t offset = batch_align(align);
-	batch->ptr += size;
-	return memset(batch->buffer + offset, 0, size);
-}
-
-static uint32_t
-batch_offset(void *ptr)
-{
-	return (uint8_t *)ptr - batch->buffer;
-}
-
-static uint32_t
-batch_copy(const void *ptr, uint32_t size, uint32_t align)
-{
-	return batch_offset(memcpy(batch_alloc(size, align), ptr, size));
-}
-
-static void
-gen6_render_flush(uint32_t batch_end)
-{
-	int ret;
-
-	ret = drm_intel_bo_subdata(batch->bo, 0, 4096, batch->buffer);
-	if (ret == 0)
-		ret = drm_intel_bo_mrb_exec(batch->bo, batch_end,
-					    NULL, 0, 0, 0);
-	assert(ret == 0);
-}
-
-static uint32_t
-gen6_bind_buf(struct scratch_buf *buf,
-	      uint32_t format, int is_dst)
-{
-	struct gen6_surface_state *ss;
-	uint32_t write_domain, read_domain;
-	int ret;
-
-	if (is_dst) {
-		write_domain = read_domain = I915_GEM_DOMAIN_RENDER;
-	} else {
-		write_domain = 0;
-		read_domain = I915_GEM_DOMAIN_SAMPLER;
-	}
-
-	ss = batch_alloc(sizeof(*ss), 32);
-	ss->ss0.surface_type = GEN6_SURFACE_2D;
-	ss->ss0.surface_format = format;
-
-	ss->ss0.data_return_format = GEN6_SURFACERETURNFORMAT_FLOAT32;
-	ss->ss0.color_blend = 1;
-	ss->ss1.base_addr = buf->bo->offset;
-
-	ret = drm_intel_bo_emit_reloc(batch->bo,
-				      batch_offset(ss) + 4,
-				      buf->bo, 0,
-				      read_domain, write_domain);
-	assert(ret == 0);
-
-	ss->ss2.height = buf_height(buf) - 1;
-	ss->ss2.width  = buf_width(buf) - 1;
-	ss->ss3.pitch  = buf->stride - 1;
-	ss->ss3.tiled_surface = buf->tiling != I915_TILING_NONE;
-	ss->ss3.tile_walk     = buf->tiling == I915_TILING_Y;
-
-	return batch_offset(ss);
-}
-
-static uint32_t
-gen6_bind_surfaces(struct scratch_buf *src,
-		   struct scratch_buf *dst)
-{
-	uint32_t *binding_table;
-
-	binding_table = batch_alloc(32, 32);
-
-	binding_table[0] =
-		gen6_bind_buf(dst, GEN6_SURFACEFORMAT_B8G8R8A8_UNORM, 1);
-	binding_table[1] =
-		gen6_bind_buf(src, GEN6_SURFACEFORMAT_B8G8R8A8_UNORM, 0);
-
-	return batch_offset(binding_table);
-}
-
-static void
-gen6_emit_sip(void)
-{
-	OUT_BATCH(GEN6_STATE_SIP | 0);
-	OUT_BATCH(0);
-}
-
-static void
-gen6_emit_urb(void)
-{
-	OUT_BATCH(GEN6_3DSTATE_URB | (3 - 2));
-	OUT_BATCH((1 - 1) << GEN6_3DSTATE_URB_VS_SIZE_SHIFT |
-		  24 << GEN6_3DSTATE_URB_VS_ENTRIES_SHIFT); /* at least 24 on GEN6 */
-	OUT_BATCH(0 << GEN6_3DSTATE_URB_GS_SIZE_SHIFT |
-		  0 << GEN6_3DSTATE_URB_GS_ENTRIES_SHIFT); /* no GS thread */
-}
-
-static void
-gen6_emit_state_base_address(void)
-{
-	OUT_BATCH(GEN6_STATE_BASE_ADDRESS | (10 - 2));
-	OUT_BATCH(0); /* general */
-	OUT_RELOC(batch->bo, /* surface */
-		  I915_GEM_DOMAIN_INSTRUCTION, 0,
-		  BASE_ADDRESS_MODIFY);
-	OUT_RELOC(batch->bo, /* instruction */
-		  I915_GEM_DOMAIN_INSTRUCTION, 0,
-		  BASE_ADDRESS_MODIFY);
-	OUT_BATCH(0); /* indirect */
-	OUT_RELOC(batch->bo, /* dynamic */
-		  I915_GEM_DOMAIN_INSTRUCTION, 0,
-		  BASE_ADDRESS_MODIFY);
-
-	/* upper bounds, disable */
-	OUT_BATCH(0);
-	OUT_BATCH(BASE_ADDRESS_MODIFY);
-	OUT_BATCH(0);
-	OUT_BATCH(BASE_ADDRESS_MODIFY);
-}
-
-static void
-gen6_emit_viewports(uint32_t cc_vp)
-{
-	OUT_BATCH(GEN6_3DSTATE_VIEWPORT_STATE_POINTERS |
-		  GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_CC |
-		  (4 - 2));
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(cc_vp);
-}
-
-static void
-gen6_emit_vs(void)
-{
-	/* disable VS constant buffer */
-	OUT_BATCH(GEN6_3DSTATE_CONSTANT_VS | (5 - 2));
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-
-	OUT_BATCH(GEN6_3DSTATE_VS | (6 - 2));
-	OUT_BATCH(0); /* no VS kernel */
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0); /* pass-through */
-}
-
-static void
-gen6_emit_gs(void)
-{
-	/* disable GS constant buffer */
-	OUT_BATCH(GEN6_3DSTATE_CONSTANT_GS | (5 - 2));
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-
-	OUT_BATCH(GEN6_3DSTATE_GS | (7 - 2));
-	OUT_BATCH(0); /* no GS kernel */
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0); /* pass-through */
-}
-
-static void
-gen6_emit_clip(void)
-{
-	OUT_BATCH(GEN6_3DSTATE_CLIP | (4 - 2));
-	OUT_BATCH(0);
-	OUT_BATCH(0); /* pass-through */
-	OUT_BATCH(0);
-}
-
-static void
-gen6_emit_wm_constants(void)
-{
-	/* disable WM constant buffer */
-	OUT_BATCH(GEN6_3DSTATE_CONSTANT_PS | (5 - 2));
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-}
-
-static void
-gen6_emit_null_depth_buffer(void)
-{
-	OUT_BATCH(GEN6_3DSTATE_DEPTH_BUFFER | (7 - 2));
-	OUT_BATCH(GEN6_SURFACE_NULL << GEN6_3DSTATE_DEPTH_BUFFER_TYPE_SHIFT |
-		  GEN6_DEPTHFORMAT_D32_FLOAT << GEN6_3DSTATE_DEPTH_BUFFER_FORMAT_SHIFT);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-
-	OUT_BATCH(GEN6_3DSTATE_CLEAR_PARAMS | (2 - 2));
-	OUT_BATCH(0);
-}
-
-static void
-gen6_emit_invariant(void)
-{
-	OUT_BATCH(GEN6_PIPELINE_SELECT | PIPELINE_SELECT_3D);
-
-	OUT_BATCH(GEN6_3DSTATE_MULTISAMPLE | (3 - 2));
-	OUT_BATCH(GEN6_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_CENTER |
-		  GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_1); /* 1 sample/pixel */
-	OUT_BATCH(0);
-
-	OUT_BATCH(GEN6_3DSTATE_SAMPLE_MASK | (2 - 2));
-	OUT_BATCH(1);
-}
-
-static void
-gen6_emit_cc(uint32_t blend)
-{
-	OUT_BATCH(GEN6_3DSTATE_CC_STATE_POINTERS | (4 - 2));
-	OUT_BATCH(blend | 1);
-	OUT_BATCH(1024 | 1);
-	OUT_BATCH(1024 | 1);
-}
-
-static void
-gen6_emit_sampler(uint32_t state)
-{
-	OUT_BATCH(GEN6_3DSTATE_SAMPLER_STATE_POINTERS |
-		  GEN6_3DSTATE_SAMPLER_STATE_MODIFY_PS |
-		  (4 - 2));
-	OUT_BATCH(0); /* VS */
-	OUT_BATCH(0); /* GS */
-	OUT_BATCH(state);
-}
-
-static void
-gen6_emit_sf(void)
-{
-	OUT_BATCH(GEN6_3DSTATE_SF | (20 - 2));
-	OUT_BATCH(1 << GEN6_3DSTATE_SF_NUM_OUTPUTS_SHIFT |
-		  1 << GEN6_3DSTATE_SF_URB_ENTRY_READ_LENGTH_SHIFT |
-		  1 << GEN6_3DSTATE_SF_URB_ENTRY_READ_OFFSET_SHIFT);
-	OUT_BATCH(0);
-	OUT_BATCH(GEN6_3DSTATE_SF_CULL_NONE);
-	OUT_BATCH(2 << GEN6_3DSTATE_SF_TRIFAN_PROVOKE_SHIFT); /* DW4 */
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0); /* DW9 */
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0); /* DW14 */
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-	OUT_BATCH(0); /* DW19 */
-}
-
-static void
-gen6_emit_wm(int kernel)
-{
-	OUT_BATCH(GEN6_3DSTATE_WM | (9 - 2));
-	OUT_BATCH(kernel);
-	OUT_BATCH(1 << GEN6_3DSTATE_WM_SAMPLER_COUNT_SHIFT |
-		  2 << GEN6_3DSTATE_WM_BINDING_TABLE_ENTRY_COUNT_SHIFT);
-	OUT_BATCH(0);
-	OUT_BATCH(6 << GEN6_3DSTATE_WM_DISPATCH_START_GRF_0_SHIFT); /* DW4 */
-	OUT_BATCH((40 - 1) << GEN6_3DSTATE_WM_MAX_THREADS_SHIFT |
-		  GEN6_3DSTATE_WM_DISPATCH_ENABLE |
-		  GEN6_3DSTATE_WM_16_DISPATCH_ENABLE);
-	OUT_BATCH(1 << GEN6_3DSTATE_WM_NUM_SF_OUTPUTS_SHIFT |
-		  GEN6_3DSTATE_WM_PERSPECTIVE_PIXEL_BARYCENTRIC);
-	OUT_BATCH(0);
-	OUT_BATCH(0);
-}
-
-static void
-gen6_emit_binding_table(uint32_t wm_table)
-{
-	OUT_BATCH(GEN6_3DSTATE_BINDING_TABLE_POINTERS |
-		  GEN6_3DSTATE_BINDING_TABLE_MODIFY_PS |
-		  (4 - 2));
-	OUT_BATCH(0);		/* vs */
-	OUT_BATCH(0);		/* gs */
-	OUT_BATCH(wm_table);
-}
-
-static void
-gen6_emit_drawing_rectangle(struct scratch_buf *dst)
-{
-	OUT_BATCH(GEN6_3DSTATE_DRAWING_RECTANGLE | (4 - 2));
-	OUT_BATCH(0);
-	OUT_BATCH((buf_height(dst) - 1) << 16 | (buf_width(dst) - 1));
-	OUT_BATCH(0);
-}
-
-static void
-gen6_emit_vertex_elements(void)
-{
-	/* The VUE layout
-	 *    dword 0-3: pad (0.0, 0.0, 0.0. 0.0)
-	 *    dword 4-7: position (x, y, 1.0, 1.0),
-	 *    dword 8-11: texture coordinate 0 (u0, v0, 0, 0)
-	 *
-	 * dword 4-11 are fetched from vertex buffer
-	 */
-	OUT_BATCH(GEN6_3DSTATE_VERTEX_ELEMENTS | (2 * 3 + 1 - 2));
-
-	OUT_BATCH(0 << VE0_VERTEX_BUFFER_INDEX_SHIFT | VE0_VALID |
-		  GEN6_SURFACEFORMAT_R32G32B32A32_FLOAT << VE0_FORMAT_SHIFT |
-		  0 << VE0_OFFSET_SHIFT);
-	OUT_BATCH(GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_0_SHIFT |
-		  GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_1_SHIFT |
-		  GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_2_SHIFT |
-		  GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_3_SHIFT);
-
-	/* x,y */
-	OUT_BATCH(0 << VE0_VERTEX_BUFFER_INDEX_SHIFT | VE0_VALID |
-		  GEN6_SURFACEFORMAT_R16G16_SSCALED << VE0_FORMAT_SHIFT |
-		  0 << VE0_OFFSET_SHIFT); /* offsets vb in bytes */
-	OUT_BATCH(GEN6_VFCOMPONENT_STORE_SRC << VE1_VFCOMPONENT_0_SHIFT |
-		  GEN6_VFCOMPONENT_STORE_SRC << VE1_VFCOMPONENT_1_SHIFT |
-		  GEN6_VFCOMPONENT_STORE_1_FLT << VE1_VFCOMPONENT_2_SHIFT |
-		  GEN6_VFCOMPONENT_STORE_1_FLT << VE1_VFCOMPONENT_3_SHIFT);
-
-	/* u0, v0 */
-	OUT_BATCH(0 << VE0_VERTEX_BUFFER_INDEX_SHIFT | VE0_VALID |
-		  GEN6_SURFACEFORMAT_R32G32_FLOAT << VE0_FORMAT_SHIFT |
-		  4 << VE0_OFFSET_SHIFT);	/* offset vb in bytes */
-	OUT_BATCH(GEN6_VFCOMPONENT_STORE_SRC << VE1_VFCOMPONENT_0_SHIFT |
-		  GEN6_VFCOMPONENT_STORE_SRC << VE1_VFCOMPONENT_1_SHIFT |
-		  GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_2_SHIFT |
-		  GEN6_VFCOMPONENT_STORE_0 << VE1_VFCOMPONENT_3_SHIFT);
-}
-
-static uint32_t
-gen6_create_cc_viewport(void)
-{
-	struct gen6_cc_viewport *vp;
-
-	vp = batch_alloc(sizeof(*vp), 32);
-
-	vp->min_depth = -1.e35;
-	vp->max_depth = 1.e35;
-
-	return batch_offset(vp);
-}
-
-static uint32_t
-gen6_create_cc_blend(void)
-{
-	struct gen6_blend_state *blend;
-
-	blend = batch_alloc(sizeof(*blend), 64);
-
-	blend->blend0.dest_blend_factor = GEN6_BLENDFACTOR_ZERO;
-	blend->blend0.source_blend_factor = GEN6_BLENDFACTOR_ONE;
-	blend->blend0.blend_func = GEN6_BLENDFUNCTION_ADD;
-	blend->blend0.blend_enable = 1;
-
-	blend->blend1.post_blend_clamp_enable = 1;
-	blend->blend1.pre_blend_clamp_enable = 1;
-
-	return batch_offset(blend);
-}
-
-static uint32_t
-gen6_create_kernel(void)
-{
-	return batch_copy(ps_kernel_nomask_affine,
-			  sizeof(ps_kernel_nomask_affine),
-			  64);
-}
-
-static uint32_t
-gen6_create_sampler(sampler_filter_t filter,
-		   sampler_extend_t extend)
-{
-	struct gen6_sampler_state *ss;
-
-	ss = batch_alloc(sizeof(*ss), 32);
-	ss->ss0.lod_preclamp = 1;	/* GL mode */
-
-	/* We use the legacy mode to get the semantics specified by
-	 * the Render extension. */
-	ss->ss0.border_color_mode = GEN6_BORDER_COLOR_MODE_LEGACY;
-
-	switch (filter) {
-	default:
-	case SAMPLER_FILTER_NEAREST:
-		ss->ss0.min_filter = GEN6_MAPFILTER_NEAREST;
-		ss->ss0.mag_filter = GEN6_MAPFILTER_NEAREST;
-		break;
-	case SAMPLER_FILTER_BILINEAR:
-		ss->ss0.min_filter = GEN6_MAPFILTER_LINEAR;
-		ss->ss0.mag_filter = GEN6_MAPFILTER_LINEAR;
-		break;
-	}
-
-	switch (extend) {
-	default:
-	case SAMPLER_EXTEND_NONE:
-		ss->ss1.r_wrap_mode = GEN6_TEXCOORDMODE_CLAMP_BORDER;
-		ss->ss1.s_wrap_mode = GEN6_TEXCOORDMODE_CLAMP_BORDER;
-		ss->ss1.t_wrap_mode = GEN6_TEXCOORDMODE_CLAMP_BORDER;
-		break;
-	case SAMPLER_EXTEND_REPEAT:
-		ss->ss1.r_wrap_mode = GEN6_TEXCOORDMODE_WRAP;
-		ss->ss1.s_wrap_mode = GEN6_TEXCOORDMODE_WRAP;
-		ss->ss1.t_wrap_mode = GEN6_TEXCOORDMODE_WRAP;
-		break;
-	case SAMPLER_EXTEND_PAD:
-		ss->ss1.r_wrap_mode = GEN6_TEXCOORDMODE_CLAMP;
-		ss->ss1.s_wrap_mode = GEN6_TEXCOORDMODE_CLAMP;
-		ss->ss1.t_wrap_mode = GEN6_TEXCOORDMODE_CLAMP;
-		break;
-	case SAMPLER_EXTEND_REFLECT:
-		ss->ss1.r_wrap_mode = GEN6_TEXCOORDMODE_MIRROR;
-		ss->ss1.s_wrap_mode = GEN6_TEXCOORDMODE_MIRROR;
-		ss->ss1.t_wrap_mode = GEN6_TEXCOORDMODE_MIRROR;
-		break;
-	}
-
-	return batch_offset(ss);
-}
-
-static void gen6_emit_vertex_buffer(void)
-{
-	OUT_BATCH(GEN6_3DSTATE_VERTEX_BUFFERS | 3);
-	OUT_BATCH(VB0_VERTEXDATA |
-		  0 << VB0_BUFFER_INDEX_SHIFT |
-		  VERTEX_SIZE << VB0_BUFFER_PITCH_SHIFT);
-	OUT_RELOC(batch->bo, I915_GEM_DOMAIN_VERTEX, 0, 0);
-	OUT_RELOC(batch->bo, I915_GEM_DOMAIN_VERTEX, 0, batch->bo->size-1);
-	OUT_BATCH(0);
-}
-
-static uint32_t gen6_emit_primitive(void)
-{
-	uint32_t offset;
-
-	OUT_BATCH(GEN6_3DPRIMITIVE |
-		  GEN6_3DPRIMITIVE_VERTEX_SEQUENTIAL |
-		  _3DPRIM_RECTLIST << GEN6_3DPRIMITIVE_TOPOLOGY_SHIFT |
-		  0 << 9 |
-		  4);
-	OUT_BATCH(3);	/* vertex count */
-	offset = batch_used();
-	OUT_BATCH(0);	/* vertex_index */
-	OUT_BATCH(1);	/* single instance */
-	OUT_BATCH(0);	/* start instance location */
-	OUT_BATCH(0);	/* index buffer offset, ignored */
-
-	return offset;
-}
-
-void gen6_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
-			  struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
-			  unsigned logical_tile_no)
-{
-	uint32_t wm_state, wm_kernel, wm_table;
-	uint32_t cc_vp, cc_blend, offset;
-	uint32_t batch_end;
-
-	intel_batchbuffer_flush(batch);
-
-	batch->ptr = batch->buffer + 1024;
-	batch_alloc(64, 64);
-	wm_table  = gen6_bind_surfaces(src, dst);
-	wm_kernel = gen6_create_kernel();
-	wm_state  = gen6_create_sampler(SAMPLER_FILTER_NEAREST,
-					SAMPLER_EXTEND_NONE);
-
-	cc_vp = gen6_create_cc_viewport();
-	cc_blend = gen6_create_cc_blend();
-
-	batch->ptr = batch->buffer;
-
-	gen6_emit_invariant();
-	gen6_emit_state_base_address();
-
-	gen6_emit_sip();
-	gen6_emit_urb();
-
-	gen6_emit_viewports(cc_vp);
-	gen6_emit_vs();
-	gen6_emit_gs();
-	gen6_emit_clip();
-	gen6_emit_wm_constants();
-	gen6_emit_null_depth_buffer();
-
-	gen6_emit_drawing_rectangle(dst);
-	gen6_emit_cc(cc_blend);
-	gen6_emit_sampler(wm_state);
-	gen6_emit_sf();
-	gen6_emit_wm(wm_kernel);
-	gen6_emit_vertex_elements();
-	gen6_emit_binding_table(wm_table);
-
-	gen6_emit_vertex_buffer();
-	offset = gen6_emit_primitive();
-
-	OUT_BATCH(MI_BATCH_BUFFER_END);
-	batch_end = batch_align(8);
-
-	*(uint32_t*)(batch->buffer + offset) =
-		batch_round_upto(VERTEX_SIZE)/VERTEX_SIZE;
-
-	emit_vertex_2s(dst_x + options.tile_size, dst_y + options.tile_size);
-	emit_vertex_normalized(src_x + options.tile_size, buf_width(src));
-	emit_vertex_normalized(src_y + options.tile_size, buf_height(src));
-
-	emit_vertex_2s(dst_x, dst_y + options.tile_size);
-	emit_vertex_normalized(src_x, buf_width(src));
-	emit_vertex_normalized(src_y + options.tile_size, buf_height(src));
-
-	emit_vertex_2s(dst_x, dst_y);
-	emit_vertex_normalized(src_x, buf_width(src));
-	emit_vertex_normalized(src_y, buf_height(src));
-
-	gen6_render_flush(batch_end);
-	intel_batchbuffer_reset(batch);
-}
diff --git a/tests/gem_stress_i830.c b/tests/gem_stress_i830.c
deleted file mode 100644
index 317a492..0000000
--- a/tests/gem_stress_i830.c
+++ /dev/null
@@ -1,354 +0,0 @@
-#include "i830_reg.h"
-#include "gem_stress.h"
-
-#define TB0C_LAST_STAGE	(1 << 31)
-#define TB0C_RESULT_SCALE_1X		(0 << 29)
-#define TB0C_RESULT_SCALE_2X		(1 << 29)
-#define TB0C_RESULT_SCALE_4X		(2 << 29)
-#define TB0C_OP_MODULE			(3 << 25)
-#define TB0C_OUTPUT_WRITE_CURRENT	(0 << 24)
-#define TB0C_OUTPUT_WRITE_ACCUM		(1 << 24)
-#define TB0C_ARG3_REPLICATE_ALPHA 	(1<<23)
-#define TB0C_ARG3_INVERT		(1<<22)
-#define TB0C_ARG3_SEL_XXX
-#define TB0C_ARG2_REPLICATE_ALPHA 	(1<<17)
-#define TB0C_ARG2_INVERT		(1<<16)
-#define TB0C_ARG2_SEL_ONE		(0 << 12)
-#define TB0C_ARG2_SEL_FACTOR		(1 << 12)
-#define TB0C_ARG2_SEL_TEXEL0		(6 << 12)
-#define TB0C_ARG2_SEL_TEXEL1		(7 << 12)
-#define TB0C_ARG2_SEL_TEXEL2		(8 << 12)
-#define TB0C_ARG2_SEL_TEXEL3		(9 << 12)
-#define TB0C_ARG1_REPLICATE_ALPHA 	(1<<11)
-#define TB0C_ARG1_INVERT		(1<<10)
-#define TB0C_ARG1_SEL_ONE		(0 << 6)
-#define TB0C_ARG1_SEL_TEXEL0		(6 << 6)
-#define TB0C_ARG1_SEL_TEXEL1		(7 << 6)
-#define TB0C_ARG1_SEL_TEXEL2		(8 << 6)
-#define TB0C_ARG1_SEL_TEXEL3		(9 << 6)
-#define TB0C_ARG0_REPLICATE_ALPHA 	(1<<5)
-#define TB0C_ARG0_SEL_XXX
-
-#define TB0A_CTR_STAGE_ENABLE 		(1<<31)
-#define TB0A_RESULT_SCALE_1X		(0 << 29)
-#define TB0A_RESULT_SCALE_2X		(1 << 29)
-#define TB0A_RESULT_SCALE_4X		(2 << 29)
-#define TB0A_OP_MODULE			(3 << 25)
-#define TB0A_OUTPUT_WRITE_CURRENT	(0<<24)
-#define TB0A_OUTPUT_WRITE_ACCUM		(1<<24)
-#define TB0A_CTR_STAGE_SEL_BITS_XXX
-#define TB0A_ARG3_SEL_XXX
-#define TB0A_ARG3_INVERT		(1<<17)
-#define TB0A_ARG2_INVERT		(1<<16)
-#define TB0A_ARG2_SEL_ONE		(0 << 12)
-#define TB0A_ARG2_SEL_TEXEL0		(6 << 12)
-#define TB0A_ARG2_SEL_TEXEL1		(7 << 12)
-#define TB0A_ARG2_SEL_TEXEL2		(8 << 12)
-#define TB0A_ARG2_SEL_TEXEL3		(9 << 12)
-#define TB0A_ARG1_INVERT		(1<<10)
-#define TB0A_ARG1_SEL_ONE		(0 << 6)
-#define TB0A_ARG1_SEL_TEXEL0		(6 << 6)
-#define TB0A_ARG1_SEL_TEXEL1		(7 << 6)
-#define TB0A_ARG1_SEL_TEXEL2		(8 << 6)
-#define TB0A_ARG1_SEL_TEXEL3		(9 << 6)
-
-void gen2_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
-			  struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
-			  unsigned logical_tile_no)
-{
-	static unsigned keep_gpu_busy_counter = 0;
-
-	/* check both edges of the fence usage */
-	if (keep_gpu_busy_counter & 1)
-		keep_gpu_busy();
-
-	/* invariant state */
-	{
-		OUT_BATCH(_3DSTATE_MAP_CUBE | MAP_UNIT(0));
-		OUT_BATCH(_3DSTATE_MAP_CUBE | MAP_UNIT(1));
-		OUT_BATCH(_3DSTATE_MAP_CUBE | MAP_UNIT(2));
-		OUT_BATCH(_3DSTATE_MAP_CUBE | MAP_UNIT(3));
-
-		OUT_BATCH(_3DSTATE_DFLT_DIFFUSE_CMD);
-		OUT_BATCH(0);
-
-		OUT_BATCH(_3DSTATE_DFLT_SPEC_CMD);
-		OUT_BATCH(0);
-
-		OUT_BATCH(_3DSTATE_DFLT_Z_CMD);
-		OUT_BATCH(0);
-
-		OUT_BATCH(_3DSTATE_FOG_MODE_CMD);
-		OUT_BATCH(FOGFUNC_ENABLE |
-			  FOG_LINEAR_CONST | FOGSRC_INDEX_Z | ENABLE_FOG_DENSITY);
-		OUT_BATCH(0);
-		OUT_BATCH(0);
-
-		OUT_BATCH(_3DSTATE_MAP_TEX_STREAM_CMD |
-			  MAP_UNIT(0) |
-			  DISABLE_TEX_STREAM_BUMP |
-			  ENABLE_TEX_STREAM_COORD_SET |
-			  TEX_STREAM_COORD_SET(0) |
-			  ENABLE_TEX_STREAM_MAP_IDX | TEX_STREAM_MAP_IDX(0));
-		OUT_BATCH(_3DSTATE_MAP_TEX_STREAM_CMD |
-			  MAP_UNIT(1) |
-			  DISABLE_TEX_STREAM_BUMP |
-			  ENABLE_TEX_STREAM_COORD_SET |
-			  TEX_STREAM_COORD_SET(1) |
-			  ENABLE_TEX_STREAM_MAP_IDX | TEX_STREAM_MAP_IDX(1));
-		OUT_BATCH(_3DSTATE_MAP_TEX_STREAM_CMD |
-			  MAP_UNIT(2) |
-			  DISABLE_TEX_STREAM_BUMP |
-			  ENABLE_TEX_STREAM_COORD_SET |
-			  TEX_STREAM_COORD_SET(2) |
-			  ENABLE_TEX_STREAM_MAP_IDX | TEX_STREAM_MAP_IDX(2));
-		OUT_BATCH(_3DSTATE_MAP_TEX_STREAM_CMD |
-			  MAP_UNIT(3) |
-			  DISABLE_TEX_STREAM_BUMP |
-			  ENABLE_TEX_STREAM_COORD_SET |
-			  TEX_STREAM_COORD_SET(3) |
-			  ENABLE_TEX_STREAM_MAP_IDX | TEX_STREAM_MAP_IDX(3));
-
-		OUT_BATCH(_3DSTATE_MAP_COORD_TRANSFORM);
-		OUT_BATCH(DISABLE_TEX_TRANSFORM | TEXTURE_SET(0));
-		OUT_BATCH(_3DSTATE_MAP_COORD_TRANSFORM);
-		OUT_BATCH(DISABLE_TEX_TRANSFORM | TEXTURE_SET(1));
-		OUT_BATCH(_3DSTATE_MAP_COORD_TRANSFORM);
-		OUT_BATCH(DISABLE_TEX_TRANSFORM | TEXTURE_SET(2));
-		OUT_BATCH(_3DSTATE_MAP_COORD_TRANSFORM);
-		OUT_BATCH(DISABLE_TEX_TRANSFORM | TEXTURE_SET(3));
-
-		OUT_BATCH(_3DSTATE_RASTER_RULES_CMD |
-			  ENABLE_POINT_RASTER_RULE |
-			  OGL_POINT_RASTER_RULE |
-			  ENABLE_LINE_STRIP_PROVOKE_VRTX |
-			  ENABLE_TRI_FAN_PROVOKE_VRTX |
-			  ENABLE_TRI_STRIP_PROVOKE_VRTX |
-			  LINE_STRIP_PROVOKE_VRTX(1) |
-			  TRI_FAN_PROVOKE_VRTX(2) | TRI_STRIP_PROVOKE_VRTX(2));
-
-		OUT_BATCH(_3DSTATE_SCISSOR_ENABLE_CMD | DISABLE_SCISSOR_RECT);
-
-		OUT_BATCH(_3DSTATE_SCISSOR_RECT_0_CMD);
-		OUT_BATCH(0);
-		OUT_BATCH(0);
-
-		OUT_BATCH(_3DSTATE_VERTEX_TRANSFORM);
-		OUT_BATCH(DISABLE_VIEWPORT_TRANSFORM | DISABLE_PERSPECTIVE_DIVIDE);
-
-		OUT_BATCH(_3DSTATE_W_STATE_CMD);
-		OUT_BATCH(MAGIC_W_STATE_DWORD1);
-		OUT_BATCH(0x3f800000 /* 1.0 in IEEE float */ );
-
-		OUT_BATCH(_3DSTATE_COLOR_FACTOR_CMD);
-		OUT_BATCH(0x80808080);	/* .5 required in alpha for GL_DOT3_RGBA_EXT */
-
-		OUT_BATCH(_3DSTATE_MAP_COORD_SETBIND_CMD);
-		OUT_BATCH(TEXBIND_SET3(TEXCOORDSRC_VTXSET_3) |
-			  TEXBIND_SET2(TEXCOORDSRC_VTXSET_2) |
-			  TEXBIND_SET1(TEXCOORDSRC_VTXSET_1) |
-			  TEXBIND_SET0(TEXCOORDSRC_VTXSET_0));
-
-		/* copy from mesa */
-		OUT_BATCH(_3DSTATE_FOG_COLOR_CMD |
-			  FOG_COLOR_RED(0) | FOG_COLOR_GREEN(0) | FOG_COLOR_BLUE(0));
-
-		OUT_BATCH(_3DSTATE_CONST_BLEND_COLOR_CMD);
-		OUT_BATCH(0);
-
-		OUT_BATCH(_3DSTATE_MODES_1_CMD |
-			  ENABLE_COLR_BLND_FUNC |
-			  BLENDFUNC_ADD |
-			  ENABLE_SRC_BLND_FACTOR |
-			  SRC_BLND_FACT(BLENDFACTOR_ONE) |
-			  ENABLE_DST_BLND_FACTOR | DST_BLND_FACT(BLENDFACTOR_ZERO));
-		OUT_BATCH(_3DSTATE_MODES_2_CMD | ENABLE_GLOBAL_DEPTH_BIAS | GLOBAL_DEPTH_BIAS(0) | ENABLE_ALPHA_TEST_FUNC | ALPHA_TEST_FUNC(0) |	/* always */
-			  ALPHA_REF_VALUE(0));
-		OUT_BATCH(_3DSTATE_MODES_3_CMD |
-			  ENABLE_DEPTH_TEST_FUNC |
-			  DEPTH_TEST_FUNC(0x2) |	/* COMPAREFUNC_LESS */
-			  ENABLE_ALPHA_SHADE_MODE |
-			  ALPHA_SHADE_MODE(SHADE_MODE_LINEAR) |
-			  ENABLE_FOG_SHADE_MODE |
-			  FOG_SHADE_MODE(SHADE_MODE_LINEAR) |
-			  ENABLE_SPEC_SHADE_MODE |
-			  SPEC_SHADE_MODE(SHADE_MODE_LINEAR) |
-			  ENABLE_COLOR_SHADE_MODE |
-			  COLOR_SHADE_MODE(SHADE_MODE_LINEAR) |
-			  ENABLE_CULL_MODE | CULLMODE_NONE);
-
-		OUT_BATCH(_3DSTATE_MODES_4_CMD |
-			  ENABLE_LOGIC_OP_FUNC |
-			  LOGIC_OP_FUNC(LOGICOP_COPY) |
-			  ENABLE_STENCIL_TEST_MASK |
-			  STENCIL_TEST_MASK(0xff) |
-			  ENABLE_STENCIL_WRITE_MASK | STENCIL_WRITE_MASK(0xff));
-
-		OUT_BATCH(_3DSTATE_STENCIL_TEST_CMD |
-			  ENABLE_STENCIL_PARMS |
-			  STENCIL_FAIL_OP(0) |	/* STENCILOP_KEEP */
-			  STENCIL_PASS_DEPTH_FAIL_OP(0) |	/* STENCILOP_KEEP */
-			  STENCIL_PASS_DEPTH_PASS_OP(0) |	/* STENCILOP_KEEP */
-			  ENABLE_STENCIL_TEST_FUNC |
-			  STENCIL_TEST_FUNC(0) |	/* COMPAREFUNC_ALWAYS */
-			  ENABLE_STENCIL_REF_VALUE |
-			  STENCIL_REF_VALUE(0));
-
-		OUT_BATCH(_3DSTATE_MODES_5_CMD |
-			  FLUSH_TEXTURE_CACHE |
-			  ENABLE_SPRITE_POINT_TEX | SPRITE_POINT_TEX_OFF |
-			  ENABLE_FIXED_LINE_WIDTH | FIXED_LINE_WIDTH(0x2) | /* 1.0 */
-			  ENABLE_FIXED_POINT_WIDTH | FIXED_POINT_WIDTH(1));
-
-		OUT_BATCH(_3DSTATE_STIPPLE);
-
-		/* Set default blend state */
-		OUT_BATCH(_3DSTATE_MAP_BLEND_OP_CMD(0) |
-			  TEXPIPE_COLOR |
-			  ENABLE_TEXOUTPUT_WRT_SEL |
-			  TEXOP_OUTPUT_CURRENT |
-			  DISABLE_TEX_CNTRL_STAGE |
-			  TEXOP_SCALE_1X |
-			  TEXOP_MODIFY_PARMS | TEXOP_LAST_STAGE | TEXBLENDOP_ARG1);
-		OUT_BATCH(_3DSTATE_MAP_BLEND_OP_CMD(0) |
-			  TEXPIPE_ALPHA |
-			  ENABLE_TEXOUTPUT_WRT_SEL |
-			  TEXOP_OUTPUT_CURRENT |
-			  TEXOP_SCALE_1X | TEXOP_MODIFY_PARMS | TEXBLENDOP_ARG1);
-		OUT_BATCH(_3DSTATE_MAP_BLEND_ARG_CMD(0) |
-			  TEXPIPE_COLOR |
-			  TEXBLEND_ARG1 |
-			  TEXBLENDARG_MODIFY_PARMS | TEXBLENDARG_DIFFUSE);
-		OUT_BATCH(_3DSTATE_MAP_BLEND_ARG_CMD(0) |
-			  TEXPIPE_ALPHA |
-			  TEXBLEND_ARG1 |
-			  TEXBLENDARG_MODIFY_PARMS | TEXBLENDARG_DIFFUSE);
-
-		OUT_BATCH(_3DSTATE_AA_CMD |
-			  AA_LINE_ECAAR_WIDTH_ENABLE |
-			  AA_LINE_ECAAR_WIDTH_1_0 |
-			  AA_LINE_REGION_WIDTH_ENABLE |
-			  AA_LINE_REGION_WIDTH_1_0 | AA_LINE_DISABLE);
-	}
-
-	/* render target state */
-	{
-		uint32_t tiling_bits = 0;
-		if (dst->tiling != I915_TILING_NONE)
-			tiling_bits = BUF_3D_TILED_SURFACE;
-		if (dst->tiling == I915_TILING_Y)
-			tiling_bits |= BUF_3D_TILE_WALK_Y;
-
-		OUT_BATCH(_3DSTATE_BUF_INFO_CMD);
-		OUT_BATCH(BUF_3D_ID_COLOR_BACK | tiling_bits |
-			  BUF_3D_PITCH(dst->stride));
-		OUT_RELOC(dst->bo, I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER, 0);
-
-		OUT_BATCH(_3DSTATE_DST_BUF_VARS_CMD);
-		OUT_BATCH(COLR_BUF_ARGB8888 |
-			  DSTORG_HORT_BIAS(0x8) |
-			  DSTORG_VERT_BIAS(0x8));
-
-		OUT_BATCH(_3DSTATE_DRAW_RECT_CMD);
-		OUT_BATCH(0);
-		OUT_BATCH(0);		/* ymin, xmin */
-		OUT_BATCH(DRAW_YMAX(buf_height(dst) - 1) |
-			  DRAW_XMAX(buf_width(dst) - 1));
-		OUT_BATCH(0);		/* yorig, xorig */
-	}
-
-	/* dynamic state */
-	{
-		OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_1 |
-			  I1_LOAD_S(2) | I1_LOAD_S(3) | I1_LOAD_S(8) | 2);
-		OUT_BATCH(1);		/* number of coordinate sets */
-		OUT_BATCH(S3_CULLMODE_NONE | S3_VERTEXHAS_XY);
-		OUT_BATCH(S8_ENABLE_COLOR_BLEND | S8_BLENDFUNC_ADD |
-			  BLENDFACTOR_ONE << S8_SRC_BLEND_FACTOR_SHIFT |
-			  BLENDFACTOR_ZERO << S8_DST_BLEND_FACTOR_SHIFT |
-			  S8_ENABLE_COLOR_BUFFER_WRITE);
-
-		OUT_BATCH(_3DSTATE_INDPT_ALPHA_BLEND_CMD | DISABLE_INDPT_ALPHA_BLEND);
-
-		OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_2 |
-			  LOAD_TEXTURE_BLEND_STAGE(0) | 1);
-		OUT_BATCH(TB0C_LAST_STAGE | TB0C_RESULT_SCALE_1X | TB0C_OP_MODULE |
-			  TB0C_OUTPUT_WRITE_CURRENT | TB0C_ARG1_SEL_TEXEL0 |
-			  TB0C_ARG2_SEL_ONE);
-		OUT_BATCH(TB0A_RESULT_SCALE_1X | TB0A_OP_MODULE |
-			  TB0A_OUTPUT_WRITE_CURRENT | TB0A_ARG1_SEL_TEXEL0 |
-			  TB0A_ARG2_SEL_ONE);
-
-		OUT_BATCH(_3DSTATE_ENABLES_1_CMD | DISABLE_LOGIC_OP |
-			  DISABLE_STENCIL_TEST | DISABLE_DEPTH_BIAS |
-			  DISABLE_SPEC_ADD | DISABLE_FOG | DISABLE_ALPHA_TEST |
-			  ENABLE_COLOR_BLEND | DISABLE_DEPTH_TEST);
-		/* We have to explicitly say we don't want write disabled */
-		OUT_BATCH(_3DSTATE_ENABLES_2_CMD | ENABLE_COLOR_MASK |
-			  DISABLE_STENCIL_WRITE | ENABLE_TEX_CACHE |
-			  DISABLE_DITHER | ENABLE_COLOR_WRITE | DISABLE_DEPTH_WRITE);
-
-		OUT_BATCH(_3DSTATE_VERTEX_FORMAT_2_CMD |
-			  TEXCOORDFMT_2D << 0);
-	}
-
-	/* sampler state */
-	{
-		uint32_t tiling_bits = 0;
-		if (src->tiling != I915_TILING_NONE)
-			tiling_bits = TM0S1_TILED_SURFACE;
-		if (src->tiling == I915_TILING_Y)
-			tiling_bits |= TM0S1_TILE_WALK;
-
-		OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_2 |
-			  LOAD_TEXTURE_MAP(0) | 4);
-		OUT_RELOC(src->bo, I915_GEM_DOMAIN_SAMPLER, 0, 0);
-		OUT_BATCH((buf_height(src) - 1) << TM0S1_HEIGHT_SHIFT |
-			  (buf_width(src) - 1) << TM0S1_WIDTH_SHIFT |
-			  MAPSURF_32BIT | MT_32BIT_ARGB8888 | tiling_bits);
-		OUT_BATCH((src->stride / 4 - 1) << TM0S2_PITCH_SHIFT | TM0S2_MAP_2D);
-		OUT_BATCH(FILTER_NEAREST << TM0S3_MAG_FILTER_SHIFT |
-			  FILTER_NEAREST << TM0S3_MIN_FILTER_SHIFT |
-			  MIPFILTER_NONE << TM0S3_MIP_FILTER_SHIFT);
-		OUT_BATCH(0);	/* default color */
-		OUT_BATCH(_3DSTATE_MAP_COORD_SET_CMD | TEXCOORD_SET(0) |
-			  ENABLE_TEXCOORD_PARAMS | TEXCOORDS_ARE_NORMAL |
-			  TEXCOORDTYPE_CARTESIAN |
-			  ENABLE_ADDR_V_CNTL | TEXCOORD_ADDR_V_MODE(TEXCOORDMODE_CLAMP_BORDER) |
-			  ENABLE_ADDR_U_CNTL | TEXCOORD_ADDR_U_MODE(TEXCOORDMODE_CLAMP_BORDER));
-		/* map texel stream */
-		OUT_BATCH(_3DSTATE_MAP_COORD_SETBIND_CMD);
-		OUT_BATCH(TEXBIND_SET0(TEXCOORDSRC_VTXSET_0) |
-			  TEXBIND_SET1(TEXCOORDSRC_KEEP) |
-			  TEXBIND_SET2(TEXCOORDSRC_KEEP) |
-			  TEXBIND_SET3(TEXCOORDSRC_KEEP));
-		OUT_BATCH(_3DSTATE_MAP_TEX_STREAM_CMD | (0 << 16) |
-			  DISABLE_TEX_STREAM_BUMP |
-			  ENABLE_TEX_STREAM_COORD_SET |
-			  TEX_STREAM_COORD_SET(0) |
-			  ENABLE_TEX_STREAM_MAP_IDX | TEX_STREAM_MAP_IDX(0));
-	}
-
-	OUT_BATCH(PRIM3D_INLINE | PRIM3D_RECTLIST | (3*4 -1));
-	emit_vertex(dst_x + options.tile_size);
-	emit_vertex(dst_y + options.tile_size);
-	emit_vertex_normalized(src_x + options.tile_size, buf_width(src));
-	emit_vertex_normalized(src_y + options.tile_size, buf_height(src));
-
-	emit_vertex(dst_x);
-	emit_vertex(dst_y + options.tile_size);
-	emit_vertex_normalized(src_x, buf_width(src));
-	emit_vertex_normalized(src_y + options.tile_size, buf_height(src));
-
-	emit_vertex(dst_x);
-	emit_vertex(dst_y);
-	emit_vertex_normalized(src_x, buf_width(src));
-	emit_vertex_normalized(src_y, buf_height(src));
-
-	if (!(keep_gpu_busy_counter & 1))
-		keep_gpu_busy();
-
-	keep_gpu_busy_counter++;
-
-	intel_batchbuffer_flush(batch);
-}
diff --git a/tests/gem_stress_i915.c b/tests/gem_stress_i915.c
deleted file mode 100644
index 396b8d3..0000000
--- a/tests/gem_stress_i915.c
+++ /dev/null
@@ -1,190 +0,0 @@
-#include "i915_reg.h"
-#include "i915_3d.h"
-#include "gem_stress.h"
-
-void gen3_render_copyfunc(struct scratch_buf *src, unsigned src_x, unsigned src_y,
-			  struct scratch_buf *dst, unsigned dst_x, unsigned dst_y,
-			  unsigned logical_tile_no)	/* logical_tile_no is not referenced in the body */
-{	/* Emits 3D state plus one RECTLIST rectangle (options.tile_size on each side) at (dst_x, dst_y) in dst, textured from src at (src_x, src_y), then flushes the batch. */
-	static unsigned keep_gpu_busy_counter = 0;	/* incremented once per call; its parity decides where keep_gpu_busy() is called */
-
-	/* check both edges of the fence usage: when the counter is odd keep_gpu_busy() runs here, before the state emission; when it is even it runs after the vertices (see end of function) */
-	if (keep_gpu_busy_counter & 1)
-		keep_gpu_busy();
-
-	/* invariant state: values emitted here do not depend on src, dst or the coordinates */
-	{
-		OUT_BATCH(_3DSTATE_AA_CMD |
-			  AA_LINE_ECAAR_WIDTH_ENABLE |
-			  AA_LINE_ECAAR_WIDTH_1_0 |
-			  AA_LINE_REGION_WIDTH_ENABLE | AA_LINE_REGION_WIDTH_1_0);
-		OUT_BATCH(_3DSTATE_INDEPENDENT_ALPHA_BLEND_CMD |
-			  IAB_MODIFY_ENABLE |
-			  IAB_MODIFY_FUNC | (BLENDFUNC_ADD << IAB_FUNC_SHIFT) |
-			  IAB_MODIFY_SRC_FACTOR | (BLENDFACT_ONE <<
-						   IAB_SRC_FACTOR_SHIFT) |
-			  IAB_MODIFY_DST_FACTOR | (BLENDFACT_ZERO <<
-						   IAB_DST_FACTOR_SHIFT));
-		OUT_BATCH(_3DSTATE_DFLT_DIFFUSE_CMD);
-		OUT_BATCH(0);
-		OUT_BATCH(_3DSTATE_DFLT_SPEC_CMD);
-		OUT_BATCH(0);
-		OUT_BATCH(_3DSTATE_DFLT_Z_CMD);
-		OUT_BATCH(0);
-		OUT_BATCH(_3DSTATE_COORD_SET_BINDINGS |
-			  CSB_TCB(0, 0) |
-			  CSB_TCB(1, 1) |
-			  CSB_TCB(2, 2) |
-			  CSB_TCB(3, 3) |
-			  CSB_TCB(4, 4) |
-			  CSB_TCB(5, 5) | CSB_TCB(6, 6) | CSB_TCB(7, 7));
-		OUT_BATCH(_3DSTATE_RASTER_RULES_CMD |
-			  ENABLE_POINT_RASTER_RULE |
-			  OGL_POINT_RASTER_RULE |
-			  ENABLE_LINE_STRIP_PROVOKE_VRTX |
-			  ENABLE_TRI_FAN_PROVOKE_VRTX |
-			  LINE_STRIP_PROVOKE_VRTX(1) |
-			  TRI_FAN_PROVOKE_VRTX(2) | ENABLE_TEXKILL_3D_4D | TEXKILL_4D);
-		OUT_BATCH(_3DSTATE_MODES_4_CMD |
-			  ENABLE_LOGIC_OP_FUNC | LOGIC_OP_FUNC(LOGICOP_COPY) |
-			  ENABLE_STENCIL_WRITE_MASK | STENCIL_WRITE_MASK(0xff) |
-			  ENABLE_STENCIL_TEST_MASK | STENCIL_TEST_MASK(0xff));
-		OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_1 | I1_LOAD_S(3) | I1_LOAD_S(4) | I1_LOAD_S(5) | 2);	/* the next three dwords are the S3, S4 and S5 values */
-		OUT_BATCH(0x00000000);	/* Disable texture coordinate wrap-shortest */
-		OUT_BATCH((1 << S4_POINT_WIDTH_SHIFT) |
-			  S4_LINE_WIDTH_ONE |
-			  S4_CULLMODE_NONE |
-			  S4_VFMT_XY);
-		OUT_BATCH(0x00000000);	/* Stencil. */
-		OUT_BATCH(_3DSTATE_SCISSOR_ENABLE_CMD | DISABLE_SCISSOR_RECT);
-		OUT_BATCH(_3DSTATE_SCISSOR_RECT_0_CMD);
-		OUT_BATCH(0);
-		OUT_BATCH(0);
-		OUT_BATCH(_3DSTATE_DEPTH_SUBRECT_DISABLE);
-		OUT_BATCH(_3DSTATE_LOAD_INDIRECT | 0);	/* disable indirect state */
-		OUT_BATCH(0);
-		OUT_BATCH(_3DSTATE_STIPPLE);
-		OUT_BATCH(0x00000000);
-		OUT_BATCH(_3DSTATE_BACKFACE_STENCIL_OPS | BFO_ENABLE_STENCIL_TWO_SIDE | 0);
-	}
-
-	/* sampler state: one texture map (src) with nearest filtering and wrap addressing */
-	{
-#define TEX_COUNT 1	/* number of texture maps/samplers programmed below; not #undef'd in this function */
-		uint32_t tiling_bits = 0;
-		if (src->tiling != I915_TILING_NONE)
-			tiling_bits = MS3_TILED_SURFACE;
-		if (src->tiling == I915_TILING_Y)
-			tiling_bits |= MS3_TILE_WALK;
-
-		OUT_BATCH(_3DSTATE_MAP_STATE | (3 * TEX_COUNT));
-		OUT_BATCH((1 << TEX_COUNT) - 1);
-		OUT_RELOC(src->bo, I915_GEM_DOMAIN_SAMPLER, 0, 0);
-		OUT_BATCH(MAPSURF_32BIT | MT_32BIT_ARGB8888 |
-			  tiling_bits |
-			  (buf_height(src) - 1) << MS3_HEIGHT_SHIFT |
-			  (buf_width(src) - 1) << MS3_WIDTH_SHIFT);
-		OUT_BATCH((src->stride/4-1) << MS4_PITCH_SHIFT);
-
-		OUT_BATCH(_3DSTATE_SAMPLER_STATE | (3 * TEX_COUNT));
-		OUT_BATCH((1 << TEX_COUNT) - 1);
-		OUT_BATCH(MIPFILTER_NONE << SS2_MIP_FILTER_SHIFT |
-			  FILTER_NEAREST << SS2_MAG_FILTER_SHIFT |
-			  FILTER_NEAREST << SS2_MIN_FILTER_SHIFT);
-		OUT_BATCH(TEXCOORDMODE_WRAP << SS3_TCX_ADDR_MODE_SHIFT |
-			  TEXCOORDMODE_WRAP << SS3_TCY_ADDR_MODE_SHIFT |
-			  0 << SS3_TEXTUREMAP_INDEX_SHIFT);
-		OUT_BATCH(0x00000000);
-	}
-
-	/* render target state: dst is bound as the ARGB8888 color buffer */
-	{
-		uint32_t tiling_bits = 0;
-		if (dst->tiling != I915_TILING_NONE)
-			tiling_bits = BUF_3D_TILED_SURFACE;
-		if (dst->tiling == I915_TILING_Y)
-			tiling_bits |= BUF_3D_TILE_WALK_Y;
-
-		OUT_BATCH(_3DSTATE_BUF_INFO_CMD);
-		OUT_BATCH(BUF_3D_ID_COLOR_BACK | tiling_bits |
-			  BUF_3D_PITCH(dst->stride));
-		OUT_RELOC(dst->bo, I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER, 0);
-
-		OUT_BATCH(_3DSTATE_DST_BUF_VARS_CMD);
-		OUT_BATCH(COLR_BUF_ARGB8888 |
-			  DSTORG_HORT_BIAS(0x8) |
-			  DSTORG_VERT_BIAS(0x8));
-
-		/* draw rect is unconditional; it spans the whole of dst */
-		OUT_BATCH(_3DSTATE_DRAW_RECT_CMD);
-		OUT_BATCH(0x00000000);
-		OUT_BATCH(0x00000000);	/* ymin, xmin */
-		OUT_BATCH(DRAW_YMAX(buf_height(dst) - 1) |
-			  DRAW_XMAX(buf_width(dst) - 1));
-		/* yorig, xorig (relate to color buffer?) */
-		OUT_BATCH(0x00000000);
-	}
-
-	/* texfmt: vertex layout and color-buffer blend setup */
-	{
-		OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_1 |
-			  I1_LOAD_S(1) | I1_LOAD_S(2) | I1_LOAD_S(6) | 2);	/* the next three dwords are the S1, S2 and S6 values */
-		OUT_BATCH((4 << S1_VERTEX_WIDTH_SHIFT) |
-			  (4 << S1_VERTEX_PITCH_SHIFT));
-		OUT_BATCH(~S2_TEXCOORD_FMT(0, TEXCOORDFMT_NOT_PRESENT) | S2_TEXCOORD_FMT(0, TEXCOORDFMT_2D));	/* NOTE(review): presumably marks every coordinate set except set 0 as not present and set 0 as 2D - confirm against the S2_TEXCOORD_FMT definition */
-		OUT_BATCH(S6_CBUF_BLEND_ENABLE | S6_COLOR_WRITE_ENABLE |
-			  BLENDFUNC_ADD << S6_CBUF_BLEND_FUNC_SHIFT |
-			  BLENDFACT_ONE << S6_CBUF_SRC_BLEND_FACT_SHIFT |
-			  BLENDFACT_ZERO << S6_CBUF_DST_BLEND_FACT_SHIFT);
-	}
-
-	/* fragment shader */
-	{
-		OUT_BATCH(_3DSTATE_PIXEL_SHADER_PROGRAM | (1 + 3*3 - 2));	/* three instructions of three dwords each follow */
-		/* decl FS_T0 */
-		OUT_BATCH(D0_DCL |
-			  REG_TYPE(FS_T0) << D0_TYPE_SHIFT |
-			  REG_NR(FS_T0) << D0_NR_SHIFT |
-			  ((REG_TYPE(FS_T0) != REG_TYPE_S) ? D0_CHANNEL_ALL : 0));
-		OUT_BATCH(0);
-		OUT_BATCH(0);
-		/* decl FS_S0 */
-		OUT_BATCH(D0_DCL |
-			  (REG_TYPE(FS_S0) << D0_TYPE_SHIFT) |
-			  (REG_NR(FS_S0) << D0_NR_SHIFT) |
-			  ((REG_TYPE(FS_S0) != REG_TYPE_S) ? D0_CHANNEL_ALL : 0));
-		OUT_BATCH(0);
-		OUT_BATCH(0);
-		/* texld(FS_OC, FS_S0, FS_T0) */
-		OUT_BATCH(T0_TEXLD |
-			  (REG_TYPE(FS_OC) << T0_DEST_TYPE_SHIFT) |
-			  (REG_NR(FS_OC) << T0_DEST_NR_SHIFT) |
-			  (REG_NR(FS_S0) << T0_SAMPLER_NR_SHIFT));
-		OUT_BATCH((REG_TYPE(FS_T0) << T1_ADDRESS_REG_TYPE_SHIFT) |
-			  (REG_NR(FS_T0) << T1_ADDRESS_REG_NR_SHIFT));
-		OUT_BATCH(0);
-	}
-
-	OUT_BATCH(PRIM3D_RECTLIST | (3*4 - 1));	/* three vertices follow, four values each: dst x, dst y, src x, src y */
-	emit_vertex(dst_x + options.tile_size);	/* vertex 1: corner at (x + tile_size, y + tile_size) */
-	emit_vertex(dst_y + options.tile_size);
-	emit_vertex(src_x + options.tile_size);	/* NOTE(review): src coordinates are emitted without normalization - presumably this sampler setup takes unnormalized coordinates; confirm */
-	emit_vertex(src_y + options.tile_size);
-
-	emit_vertex(dst_x);	/* vertex 2: corner at (x, y + tile_size) */
-	emit_vertex(dst_y + options.tile_size);
-	emit_vertex(src_x);
-	emit_vertex(src_y + options.tile_size);
-
-	emit_vertex(dst_x);	/* vertex 3: corner at (x, y) */
-	emit_vertex(dst_y);
-	emit_vertex(src_x);
-	emit_vertex(src_y);
-
-	if (!(keep_gpu_busy_counter & 1))	/* counter even: keep_gpu_busy() runs after the vertices instead of before the state */
-		keep_gpu_busy();
-
-	keep_gpu_busy_counter++;	/* flips the parity so the next call takes the other ordering */
-
-	intel_batchbuffer_flush(batch);
-}
diff --git a/tests/gen6_render.h b/tests/gen6_render.h
deleted file mode 100644
index 2c63c9e..0000000
--- a/tests/gen6_render.h
+++ /dev/null
@@ -1,1553 +0,0 @@
-#ifndef GEN6_RENDER_H
-#define GEN6_RENDER_H
-
-#define GEN6_3D(Pipeline,Opcode,Subopcode) ((3 << 29) | \
-					   ((Pipeline) << 27) | \
-					   ((Opcode) << 24) | \
-					   ((Subopcode) << 16))
-
-#define GEN6_STATE_BASE_ADDRESS			GEN6_3D(0, 1, 1)
-#define GEN6_STATE_SIP				GEN6_3D(0, 1, 2)
-
-#define GEN6_PIPELINE_SELECT			GEN6_3D(1, 1, 4)
-
-#define GEN6_MEDIA_STATE_POINTERS		GEN6_3D(2, 0, 0)
-#define GEN6_MEDIA_OBJECT			GEN6_3D(2, 1, 0)
-
-#define GEN6_3DSTATE_BINDING_TABLE_POINTERS	GEN6_3D(3, 0, 1)
-# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_PS  (1 << 12)/* for GEN6 */
-# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_GS  (1 << 9) /* for GEN6 */
-# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_VS  (1 << 8) /* for GEN6 */
-
-#define GEN6_3DSTATE_VERTEX_BUFFERS		GEN6_3D(3, 0, 8)
-#define GEN6_3DSTATE_VERTEX_ELEMENTS		GEN6_3D(3, 0, 9)
-#define GEN6_3DSTATE_INDEX_BUFFER		GEN6_3D(3, 0, 0xa)
-#define GEN6_3DSTATE_VF_STATISTICS		GEN6_3D(3, 0, 0xb)
-
-#define GEN6_3DSTATE_DRAWING_RECTANGLE		GEN6_3D(3, 1, 0)
-#define GEN6_3DSTATE_CONSTANT_COLOR		GEN6_3D(3, 1, 1)
-#define GEN6_3DSTATE_SAMPLER_PALETTE_LOAD	GEN6_3D(3, 1, 2)
-#define GEN6_3DSTATE_CHROMA_KEY			GEN6_3D(3, 1, 4)
-#define GEN6_3DSTATE_DEPTH_BUFFER		GEN6_3D(3, 1, 5)
-# define GEN6_3DSTATE_DEPTH_BUFFER_TYPE_SHIFT	29
-# define GEN6_3DSTATE_DEPTH_BUFFER_FORMAT_SHIFT	18
-
-#define GEN6_3DSTATE_POLY_STIPPLE_OFFSET		GEN6_3D(3, 1, 6)
-#define GEN6_3DSTATE_POLY_STIPPLE_PATTERN	GEN6_3D(3, 1, 7)
-#define GEN6_3DSTATE_LINE_STIPPLE		GEN6_3D(3, 1, 8)
-#define GEN6_3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP	GEN6_3D(3, 1, 9)
-/* These two are BLC and CTG only, not BW or CL */
-#define GEN6_3DSTATE_AA_LINE_PARAMS		GEN6_3D(3, 1, 0xa)
-#define GEN6_3DSTATE_GS_SVB_INDEX		GEN6_3D(3, 1, 0xb)
-
-#define GEN6_3DPRIMITIVE				GEN6_3D(3, 3, 0)
-
-#define GEN6_3DSTATE_CLEAR_PARAMS		GEN6_3D(3, 1, 0x10)
-/* DW1 */
-# define GEN6_3DSTATE_DEPTH_CLEAR_VALID		(1 << 15)
-
-#define GEN6_3DSTATE_SAMPLER_STATE_POINTERS	GEN6_3D(3, 0, 0x02)
-# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_PS	(1 << 12)
-# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_GS	(1 << 9)
-# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_VS	(1 << 8)
-
-#define GEN6_3DSTATE_URB			GEN6_3D(3, 0, 0x05)
-/* DW1 */
-# define GEN6_3DSTATE_URB_VS_SIZE_SHIFT		16
-# define GEN6_3DSTATE_URB_VS_ENTRIES_SHIFT	0
-/* DW2 */
-# define GEN6_3DSTATE_URB_GS_ENTRIES_SHIFT	8
-# define GEN6_3DSTATE_URB_GS_SIZE_SHIFT		0
-
-#define GEN6_3DSTATE_VIEWPORT_STATE_POINTERS	GEN6_3D(3, 0, 0x0d)
-# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_CC		(1 << 12)
-# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_SF		(1 << 11)
-# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_CLIP	(1 << 10)
-
-#define GEN6_3DSTATE_CC_STATE_POINTERS		GEN6_3D(3, 0, 0x0e)
-
-#define GEN6_3DSTATE_VS				GEN6_3D(3, 0, 0x10)
-
-#define GEN6_3DSTATE_GS				GEN6_3D(3, 0, 0x11)
-/* DW4 */
-# define GEN6_3DSTATE_GS_DISPATCH_START_GRF_SHIFT	0
-
-#define GEN6_3DSTATE_CLIP			GEN6_3D(3, 0, 0x12)
-
-#define GEN6_3DSTATE_SF				GEN6_3D(3, 0, 0x13)
-/* DW1 */
-# define GEN6_3DSTATE_SF_NUM_OUTPUTS_SHIFT		22
-# define GEN6_3DSTATE_SF_URB_ENTRY_READ_LENGTH_SHIFT	11
-# define GEN6_3DSTATE_SF_URB_ENTRY_READ_OFFSET_SHIFT	4
-/* DW2 */
-/* DW3 */
-# define GEN6_3DSTATE_SF_CULL_BOTH			(0 << 29)
-# define GEN6_3DSTATE_SF_CULL_NONE			(1 << 29)
-# define GEN6_3DSTATE_SF_CULL_FRONT			(2 << 29)
-# define GEN6_3DSTATE_SF_CULL_BACK			(3 << 29)
-/* DW4 */
-# define GEN6_3DSTATE_SF_TRI_PROVOKE_SHIFT		29
-# define GEN6_3DSTATE_SF_LINE_PROVOKE_SHIFT		27
-# define GEN6_3DSTATE_SF_TRIFAN_PROVOKE_SHIFT		25
-
-#define GEN6_3DSTATE_WM				GEN6_3D(3, 0, 0x14)
-/* DW2 */
-# define GEN6_3DSTATE_WM_SAMPLER_COUNT_SHIFT			27
-# define GEN6_3DSTATE_WM_BINDING_TABLE_ENTRY_COUNT_SHIFT	18
-/* DW4 */
-# define GEN6_3DSTATE_WM_DISPATCH_START_GRF_0_SHIFT		16
-/* DW5 */
-# define GEN6_3DSTATE_WM_MAX_THREADS_SHIFT			25
-# define GEN6_3DSTATE_WM_DISPATCH_ENABLE			(1 << 19)
-# define GEN6_3DSTATE_WM_16_DISPATCH_ENABLE			(1 << 1)
-# define GEN6_3DSTATE_WM_8_DISPATCH_ENABLE			(1 << 0)
-/* DW6 */
-# define GEN6_3DSTATE_WM_NUM_SF_OUTPUTS_SHIFT			20
-# define GEN6_3DSTATE_WM_NONPERSPECTIVE_SAMPLE_BARYCENTRIC	(1 << 15)
-# define GEN6_3DSTATE_WM_NONPERSPECTIVE_CENTROID_BARYCENTRIC	(1 << 14)
-# define GEN6_3DSTATE_WM_NONPERSPECTIVE_PIXEL_BARYCENTRIC	(1 << 13)
-# define GEN6_3DSTATE_WM_PERSPECTIVE_SAMPLE_BARYCENTRIC		(1 << 12)
-# define GEN6_3DSTATE_WM_PERSPECTIVE_CENTROID_BARYCENTRIC	(1 << 11)
-# define GEN6_3DSTATE_WM_PERSPECTIVE_PIXEL_BARYCENTRIC		(1 << 10)
-
-
-#define GEN6_3DSTATE_CONSTANT_VS		GEN6_3D(3, 0, 0x15)
-#define GEN6_3DSTATE_CONSTANT_GS		GEN6_3D(3, 0, 0x16)
-#define GEN6_3DSTATE_CONSTANT_PS		GEN6_3D(3, 0, 0x17)
-
-#define GEN6_3DSTATE_SAMPLE_MASK		GEN6_3D(3, 0, 0x18)
-
-#define GEN6_3DSTATE_MULTISAMPLE		GEN6_3D(3, 1, 0x0d)
-/* DW1 */
-# define GEN6_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_CENTER		(0 << 4)
-# define GEN6_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_UPPER_LEFT	(1 << 4)
-# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_1			(0 << 1)
-# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_4			(2 << 1)
-# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_8			(3 << 1)
-
-#define PIPELINE_SELECT_3D		0
-#define PIPELINE_SELECT_MEDIA		1
-
-/* for GEN6_STATE_BASE_ADDRESS */
-#define BASE_ADDRESS_MODIFY		(1 << 0)
-
-/* for GEN6_PIPE_CONTROL */
-#define GEN6_PIPE_CONTROL_NOWRITE       (0 << 14)
-#define GEN6_PIPE_CONTROL_WRITE_QWORD   (1 << 14)
-#define GEN6_PIPE_CONTROL_WRITE_DEPTH   (2 << 14)
-#define GEN6_PIPE_CONTROL_WRITE_TIME    (3 << 14)
-#define GEN6_PIPE_CONTROL_DEPTH_STALL   (1 << 13)
-#define GEN6_PIPE_CONTROL_WC_FLUSH      (1 << 12)
-#define GEN6_PIPE_CONTROL_IS_FLUSH      (1 << 11)
-#define GEN6_PIPE_CONTROL_TC_FLUSH      (1 << 10)
-#define GEN6_PIPE_CONTROL_NOTIFY_ENABLE (1 << 8)
-#define GEN6_PIPE_CONTROL_GLOBAL_GTT    (1 << 2)
-#define GEN6_PIPE_CONTROL_LOCAL_PGTT    (0 << 2)
-#define GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH	(1 << 0)
-
-/* VERTEX_BUFFER_STATE Structure */
-#define VB0_BUFFER_INDEX_SHIFT	26
-#define VB0_VERTEXDATA			(0 << 20)
-#define VB0_INSTANCEDATA		(1 << 20)
-#define VB0_BUFFER_PITCH_SHIFT		0
-
-/* VERTEX_ELEMENT_STATE Structure */
-#define VE0_VERTEX_BUFFER_INDEX_SHIFT	26 /* for GEN6 */
-#define VE0_VALID			(1 << 25) /* for GEN6 */
-#define VE0_FORMAT_SHIFT		16
-#define VE0_OFFSET_SHIFT		0
-#define VE1_VFCOMPONENT_0_SHIFT		28
-#define VE1_VFCOMPONENT_1_SHIFT		24
-#define VE1_VFCOMPONENT_2_SHIFT		20
-#define VE1_VFCOMPONENT_3_SHIFT		16
-#define VE1_DESTINATION_ELEMENT_OFFSET_SHIFT	0
-
-/* 3DPRIMITIVE bits */
-#define GEN6_3DPRIMITIVE_VERTEX_SEQUENTIAL (0 << 15)
-#define GEN6_3DPRIMITIVE_VERTEX_RANDOM	  (1 << 15)
-/* Primitive types are in gen6_defines.h */
-#define GEN6_3DPRIMITIVE_TOPOLOGY_SHIFT	  10
-
-#define GEN6_SVG_CTL		       0x7400
-
-#define GEN6_SVG_CTL_GS_BA	       (0 << 8)
-#define GEN6_SVG_CTL_SS_BA	       (1 << 8)
-#define GEN6_SVG_CTL_IO_BA	       (2 << 8)
-#define GEN6_SVG_CTL_GS_AUB	       (3 << 8)
-#define GEN6_SVG_CTL_IO_AUB	       (4 << 8)
-#define GEN6_SVG_CTL_SIP		       (5 << 8)
-
-#define GEN6_SVG_RDATA		       0x7404
-#define GEN6_SVG_WORK_CTL	       0x7408
-
-#define GEN6_VF_CTL		       0x7500
-
-#define GEN6_VF_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
-#define GEN6_VF_CTL_SNAPSHOT_MUX_SELECT_THREADID	   (0 << 8)
-#define GEN6_VF_CTL_SNAPSHOT_MUX_SELECT_VF_DEBUG	   (1 << 8)
-#define GEN6_VF_CTL_SNAPSHOT_TYPE_VERTEX_SEQUENCE   (0 << 4)
-#define GEN6_VF_CTL_SNAPSHOT_TYPE_VERTEX_INDEX	   (1 << 4)
-#define GEN6_VF_CTL_SKIP_INITIAL_PRIMITIVES	   (1 << 3)
-#define GEN6_VF_CTL_MAX_PRIMITIVES_LIMIT_ENABLE	   (1 << 2)
-#define GEN6_VF_CTL_VERTEX_RANGE_LIMIT_ENABLE	   (1 << 1)
-#define GEN6_VF_CTL_SNAPSHOT_ENABLE	     	   (1 << 0)
-
-#define GEN6_VF_STRG_VAL		       0x7504
-#define GEN6_VF_STR_VL_OVR	       0x7508
-#define GEN6_VF_VC_OVR		       0x750c
-#define GEN6_VF_STR_PSKIP	       0x7510
-#define GEN6_VF_MAX_PRIM		       0x7514
-#define GEN6_VF_RDATA		       0x7518
-
-#define GEN6_VS_CTL		       0x7600
-#define GEN6_VS_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
-#define GEN6_VS_CTL_SNAPSHOT_MUX_VERTEX_0	   (0 << 8)
-#define GEN6_VS_CTL_SNAPSHOT_MUX_VERTEX_1	   (1 << 8)
-#define GEN6_VS_CTL_SNAPSHOT_MUX_VALID_COUNT	   (2 << 8)
-#define GEN6_VS_CTL_SNAPSHOT_MUX_VS_KERNEL_POINTER  (3 << 8)
-#define GEN6_VS_CTL_SNAPSHOT_ALL_THREADS		   (1 << 2)
-#define GEN6_VS_CTL_THREAD_SNAPSHOT_ENABLE	   (1 << 1)
-#define GEN6_VS_CTL_SNAPSHOT_ENABLE		   (1 << 0)
-
-#define GEN6_VS_STRG_VAL		       0x7604
-#define GEN6_VS_RDATA		       0x7608
-
-#define GEN6_SF_CTL		       0x7b00
-#define GEN6_SF_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_0_FF_ID	   (0 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_0_REL_COUNT (1 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_1_FF_ID	   (2 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_1_REL_COUNT (3 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_2_FF_ID	   (4 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_2_REL_COUNT (5 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_COUNT	   (6 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_SF_KERNEL_POINTER  (7 << 8)
-#define GEN6_SF_CTL_MIN_MAX_PRIMITIVE_RANGE_ENABLE  (1 << 4)
-#define GEN6_SF_CTL_DEBUG_CLIP_RECTANGLE_ENABLE	   (1 << 3)
-#define GEN6_SF_CTL_SNAPSHOT_ALL_THREADS		   (1 << 2)
-#define GEN6_SF_CTL_THREAD_SNAPSHOT_ENABLE	   (1 << 1)
-#define GEN6_SF_CTL_SNAPSHOT_ENABLE		   (1 << 0)
-
-#define GEN6_SF_STRG_VAL		       0x7b04
-#define GEN6_SF_RDATA		       0x7b18
-
-#define GEN6_WIZ_CTL		       0x7c00
-#define GEN6_WIZ_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
-#define GEN6_WIZ_CTL_SUBSPAN_INSTANCE_SHIFT	   16
-#define GEN6_WIZ_CTL_SNAPSHOT_MUX_WIZ_KERNEL_POINTER   (0 << 8)
-#define GEN6_WIZ_CTL_SNAPSHOT_MUX_SUBSPAN_INSTANCE     (1 << 8)
-#define GEN6_WIZ_CTL_SNAPSHOT_MUX_PRIMITIVE_SEQUENCE   (2 << 8)
-#define GEN6_WIZ_CTL_SINGLE_SUBSPAN_DISPATCH	      (1 << 6)
-#define GEN6_WIZ_CTL_IGNORE_COLOR_SCOREBOARD_STALLS    (1 << 5)
-#define GEN6_WIZ_CTL_ENABLE_SUBSPAN_INSTANCE_COMPARE   (1 << 4)
-#define GEN6_WIZ_CTL_USE_UPSTREAM_SNAPSHOT_FLAG	      (1 << 3)
-#define GEN6_WIZ_CTL_SNAPSHOT_ALL_THREADS	      (1 << 2)
-#define GEN6_WIZ_CTL_THREAD_SNAPSHOT_ENABLE	      (1 << 1)
-#define GEN6_WIZ_CTL_SNAPSHOT_ENABLE		      (1 << 0)
-
-#define GEN6_WIZ_STRG_VAL			      0x7c04
-#define GEN6_WIZ_RDATA				      0x7c18
-
-#define GEN6_TS_CTL		       0x7e00
-#define GEN6_TS_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
-#define GEN6_TS_CTL_SNAPSHOT_MESSAGE_ERROR	   (0 << 8)
-#define GEN6_TS_CTL_SNAPSHOT_INTERFACE_DESCRIPTOR   (3 << 8)
-#define GEN6_TS_CTL_SNAPSHOT_ALL_CHILD_THREADS	   (1 << 2)
-#define GEN6_TS_CTL_SNAPSHOT_ALL_ROOT_THREADS  	   (1 << 1)
-#define GEN6_TS_CTL_SNAPSHOT_ENABLE		   (1 << 0)
-
-#define GEN6_TS_STRG_VAL		       0x7e04
-#define GEN6_TS_RDATA		       0x7e08
-
-/* TD_CTL on gen6 is 0x7000, to not break stuff which depends on this... */
-#ifndef GEN6_TD_CTL
-#define GEN6_TD_CTL		       0x8000
-#endif
-#define GEN6_TD_CTL_MUX_SHIFT	       8
-#define GEN6_TD_CTL_EXTERNAL_HALT_R0_DEBUG_MATCH	   (1 << 7)
-#define GEN6_TD_CTL_FORCE_EXTERNAL_HALT		   (1 << 6)
-#define GEN6_TD_CTL_EXCEPTION_MASK_OVERRIDE	   (1 << 5)
-#define GEN6_TD_CTL_FORCE_THREAD_BREAKPOINT_ENABLE  (1 << 4)
-#define GEN6_TD_CTL_BREAKPOINT_ENABLE		   (1 << 2)
-#define GEN6_TD_CTL2		       0x8004
-#define GEN6_TD_CTL2_ILLEGAL_OPCODE_EXCEPTION_OVERRIDE (1 << 28)
-#define GEN6_TD_CTL2_MASKSTACK_EXCEPTION_OVERRIDE      (1 << 26)
-#define GEN6_TD_CTL2_SOFTWARE_EXCEPTION_OVERRIDE	      (1 << 25)
-#define GEN6_TD_CTL2_ACTIVE_THREAD_LIMIT_SHIFT	      16
-#define GEN6_TD_CTL2_ACTIVE_THREAD_LIMIT_ENABLE	      (1 << 8)
-#define GEN6_TD_CTL2_THREAD_SPAWNER_EXECUTION_MASK_ENABLE (1 << 7)
-#define GEN6_TD_CTL2_WIZ_EXECUTION_MASK_ENABLE	      (1 << 6)
-#define GEN6_TD_CTL2_SF_EXECUTION_MASK_ENABLE	      (1 << 5)
-#define GEN6_TD_CTL2_CLIPPER_EXECUTION_MASK_ENABLE     (1 << 4)
-#define GEN6_TD_CTL2_GS_EXECUTION_MASK_ENABLE	      (1 << 3)
-#define GEN6_TD_CTL2_VS_EXECUTION_MASK_ENABLE	      (1 << 0)
-#define GEN6_TD_VF_VS_EMSK	       0x8008
-#define GEN6_TD_GS_EMSK		       0x800c
-#define GEN6_TD_CLIP_EMSK	       0x8010
-#define GEN6_TD_SF_EMSK		       0x8014
-#define GEN6_TD_WIZ_EMSK		       0x8018
-#define GEN6_TD_0_6_EHTRG_VAL	       0x801c
-#define GEN6_TD_0_7_EHTRG_VAL	       0x8020
-#define GEN6_TD_0_6_EHTRG_MSK           0x8024
-#define GEN6_TD_0_7_EHTRG_MSK	       0x8028
-#define GEN6_TD_RDATA		       0x802c
-#define GEN6_TD_TS_EMSK		       0x8030
-
-#define GEN6_EU_CTL		       0x8800
-#define GEN6_EU_CTL_SELECT_SHIFT	       16
-#define GEN6_EU_CTL_DATA_MUX_SHIFT      8
-#define GEN6_EU_ATT_0		       0x8810
-#define GEN6_EU_ATT_1		       0x8814
-#define GEN6_EU_ATT_DATA_0	       0x8820
-#define GEN6_EU_ATT_DATA_1	       0x8824
-#define GEN6_EU_ATT_CLR_0	       0x8830
-#define GEN6_EU_ATT_CLR_1	       0x8834
-#define GEN6_EU_RDATA		       0x8840
-
-#define GEN6_3D(Pipeline,Opcode,Subopcode) ((3 << 29) | \
-					   ((Pipeline) << 27) | \
-					   ((Opcode) << 24) | \
-					   ((Subopcode) << 16))
-
-#define GEN6_STATE_BASE_ADDRESS			GEN6_3D(0, 1, 1)
-#define GEN6_STATE_SIP				GEN6_3D(0, 1, 2)
-
-#define GEN6_PIPELINE_SELECT			GEN6_3D(1, 1, 4)
-
-#define GEN6_MEDIA_STATE_POINTERS		GEN6_3D(2, 0, 0)
-#define GEN6_MEDIA_OBJECT			GEN6_3D(2, 1, 0)
-
-#define GEN6_3DSTATE_BINDING_TABLE_POINTERS	GEN6_3D(3, 0, 1)
-# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_PS  (1 << 12)/* for GEN6 */
-# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_GS  (1 << 9) /* for GEN6 */
-# define GEN6_3DSTATE_BINDING_TABLE_MODIFY_VS  (1 << 8) /* for GEN6 */
-
-#define GEN6_3DSTATE_VERTEX_BUFFERS		GEN6_3D(3, 0, 8)
-#define GEN6_3DSTATE_VERTEX_ELEMENTS		GEN6_3D(3, 0, 9)
-#define GEN6_3DSTATE_INDEX_BUFFER		GEN6_3D(3, 0, 0xa)
-#define GEN6_3DSTATE_VF_STATISTICS		GEN6_3D(3, 0, 0xb)
-
-#define GEN6_3DSTATE_DRAWING_RECTANGLE		GEN6_3D(3, 1, 0)
-#define GEN6_3DSTATE_CONSTANT_COLOR		GEN6_3D(3, 1, 1)
-#define GEN6_3DSTATE_SAMPLER_PALETTE_LOAD	GEN6_3D(3, 1, 2)
-#define GEN6_3DSTATE_CHROMA_KEY			GEN6_3D(3, 1, 4)
-#define GEN6_3DSTATE_DEPTH_BUFFER		GEN6_3D(3, 1, 5)
-# define GEN6_3DSTATE_DEPTH_BUFFER_TYPE_SHIFT	29
-# define GEN6_3DSTATE_DEPTH_BUFFER_FORMAT_SHIFT	18
-
-#define GEN6_3DSTATE_POLY_STIPPLE_OFFSET		GEN6_3D(3, 1, 6)
-#define GEN6_3DSTATE_POLY_STIPPLE_PATTERN	GEN6_3D(3, 1, 7)
-#define GEN6_3DSTATE_LINE_STIPPLE		GEN6_3D(3, 1, 8)
-#define GEN6_3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP	GEN6_3D(3, 1, 9)
-/* These two are BLC and CTG only, not BW or CL */
-#define GEN6_3DSTATE_AA_LINE_PARAMS		GEN6_3D(3, 1, 0xa)
-#define GEN6_3DSTATE_GS_SVB_INDEX		GEN6_3D(3, 1, 0xb)
-
-#define GEN6_PIPE_CONTROL			GEN6_3D(3, 2, 0)
-
-#define GEN6_3DPRIMITIVE				GEN6_3D(3, 3, 0)
-
-#define GEN6_3DSTATE_CLEAR_PARAMS		GEN6_3D(3, 1, 0x10)
-/* DW1 */
-# define GEN6_3DSTATE_DEPTH_CLEAR_VALID		(1 << 15)
-
-/* for GEN6+ */
-#define GEN6_3DSTATE_SAMPLER_STATE_POINTERS	GEN6_3D(3, 0, 0x02)
-# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_PS	(1 << 12)
-# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_GS	(1 << 9)
-# define GEN6_3DSTATE_SAMPLER_STATE_MODIFY_VS	(1 << 8)
-
-#define GEN6_3DSTATE_URB			GEN6_3D(3, 0, 0x05)
-/* DW1 */
-# define GEN6_3DSTATE_URB_VS_SIZE_SHIFT		16
-# define GEN6_3DSTATE_URB_VS_ENTRIES_SHIFT	0
-/* DW2 */
-# define GEN6_3DSTATE_URB_GS_ENTRIES_SHIFT	8
-# define GEN6_3DSTATE_URB_GS_SIZE_SHIFT		0
-
-#define GEN6_3DSTATE_VIEWPORT_STATE_POINTERS	GEN6_3D(3, 0, 0x0d)
-# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_CC		(1 << 12)
-# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_SF		(1 << 11)
-# define GEN6_3DSTATE_VIEWPORT_STATE_MODIFY_CLIP	(1 << 10)
-
-#define GEN6_3DSTATE_CC_STATE_POINTERS		GEN6_3D(3, 0, 0x0e)
-
-#define GEN6_3DSTATE_VS				GEN6_3D(3, 0, 0x10)
-
-#define GEN6_3DSTATE_GS				GEN6_3D(3, 0, 0x11)
-/* DW4 */
-# define GEN6_3DSTATE_GS_DISPATCH_START_GRF_SHIFT	0
-
-#define GEN6_3DSTATE_CLIP			GEN6_3D(3, 0, 0x12)
-
-#define GEN6_3DSTATE_SF				GEN6_3D(3, 0, 0x13)
-/* DW1 */
-# define GEN6_3DSTATE_SF_NUM_OUTPUTS_SHIFT		22
-# define GEN6_3DSTATE_SF_URB_ENTRY_READ_LENGTH_SHIFT	11
-# define GEN6_3DSTATE_SF_URB_ENTRY_READ_OFFSET_SHIFT	4
-/* DW2 */
-/* DW3 */
-# define GEN6_3DSTATE_SF_CULL_BOTH			(0 << 29)
-# define GEN6_3DSTATE_SF_CULL_NONE			(1 << 29)
-# define GEN6_3DSTATE_SF_CULL_FRONT			(2 << 29)
-# define GEN6_3DSTATE_SF_CULL_BACK			(3 << 29)
-/* DW4 */
-# define GEN6_3DSTATE_SF_TRI_PROVOKE_SHIFT		29
-# define GEN6_3DSTATE_SF_LINE_PROVOKE_SHIFT		27
-# define GEN6_3DSTATE_SF_TRIFAN_PROVOKE_SHIFT		25
-
-
-#define GEN6_3DSTATE_WM				GEN6_3D(3, 0, 0x14)
-/* DW2 */
-# define GEN6_3DSTATE_WM_SAMPLER_COUNT_SHITF			27
-# define GEN6_3DSTATE_WM_BINDING_TABLE_ENTRY_COUNT_SHIFT	18
-/* DW4 */
-# define GEN6_3DSTATE_WM_DISPATCH_START_GRF_0_SHIFT		16
-/* DW5 */
-# define GEN6_3DSTATE_WM_MAX_THREADS_SHIFT			25
-# define GEN6_3DSTATE_WM_DISPATCH_ENABLE			(1 << 19)
-# define GEN6_3DSTATE_WM_16_DISPATCH_ENABLE			(1 << 1)
-# define GEN6_3DSTATE_WM_8_DISPATCH_ENABLE			(1 << 0)
-/* DW6 */
-# define GEN6_3DSTATE_WM_NUM_SF_OUTPUTS_SHIFT			20
-# define GEN6_3DSTATE_WM_NONPERSPECTIVE_SAMPLE_BARYCENTRIC	(1 << 15)
-# define GEN6_3DSTATE_WM_NONPERSPECTIVE_CENTROID_BARYCENTRIC	(1 << 14)
-# define GEN6_3DSTATE_WM_NONPERSPECTIVE_PIXEL_BARYCENTRIC	(1 << 13)
-# define GEN6_3DSTATE_WM_PERSPECTIVE_SAMPLE_BARYCENTRIC		(1 << 12)
-# define GEN6_3DSTATE_WM_PERSPECTIVE_CENTROID_BARYCENTRIC	(1 << 11)
-# define GEN6_3DSTATE_WM_PERSPECTIVE_PIXEL_BARYCENTRIC		(1 << 10)
-
-
-#define GEN6_3DSTATE_CONSTANT_VS		GEN6_3D(3, 0, 0x15)
-#define GEN6_3DSTATE_CONSTANT_GS          	GEN6_3D(3, 0, 0x16)
-#define GEN6_3DSTATE_CONSTANT_PS          	GEN6_3D(3, 0, 0x17)
-
-#define GEN6_3DSTATE_SAMPLE_MASK		GEN6_3D(3, 0, 0x18)
-
-#define GEN6_3DSTATE_MULTISAMPLE		GEN6_3D(3, 1, 0x0d)
-/* DW1 */
-# define GEN6_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_CENTER		(0 << 4)
-# define GEN6_3DSTATE_MULTISAMPLE_PIXEL_LOCATION_UPPER_LEFT	(1 << 4)
-# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_1			(0 << 1)
-# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_4			(2 << 1)
-# define GEN6_3DSTATE_MULTISAMPLE_NUMSAMPLES_8			(3 << 1)
-
-#define PIPELINE_SELECT_3D		0
-#define PIPELINE_SELECT_MEDIA		1
-
-#define UF0_CS_REALLOC			(1 << 13)
-#define UF0_VFE_REALLOC			(1 << 12)
-#define UF0_SF_REALLOC			(1 << 11)
-#define UF0_CLIP_REALLOC		(1 << 10)
-#define UF0_GS_REALLOC			(1 << 9)
-#define UF0_VS_REALLOC			(1 << 8)
-#define UF1_CLIP_FENCE_SHIFT		20
-#define UF1_GS_FENCE_SHIFT		10
-#define UF1_VS_FENCE_SHIFT		0
-#define UF2_CS_FENCE_SHIFT		20
-#define UF2_VFE_FENCE_SHIFT		10
-#define UF2_SF_FENCE_SHIFT		0
-
-/* for GEN6_STATE_BASE_ADDRESS */
-#define BASE_ADDRESS_MODIFY		(1 << 0)
-
-/* for GEN6_3DSTATE_PIPELINED_POINTERS */
-#define GEN6_GS_DISABLE		       0
-#define GEN6_GS_ENABLE		       1
-#define GEN6_CLIP_DISABLE	       0
-#define GEN6_CLIP_ENABLE		       1
-
-/* for GEN6_PIPE_CONTROL */
-#define GEN6_PIPE_CONTROL_NOWRITE       (0 << 14)
-#define GEN6_PIPE_CONTROL_WRITE_QWORD   (1 << 14)
-#define GEN6_PIPE_CONTROL_WRITE_DEPTH   (2 << 14)
-#define GEN6_PIPE_CONTROL_WRITE_TIME    (3 << 14)
-#define GEN6_PIPE_CONTROL_DEPTH_STALL   (1 << 13)
-#define GEN6_PIPE_CONTROL_WC_FLUSH      (1 << 12)
-#define GEN6_PIPE_CONTROL_IS_FLUSH      (1 << 11)
-#define GEN6_PIPE_CONTROL_TC_FLUSH      (1 << 10)
-#define GEN6_PIPE_CONTROL_NOTIFY_ENABLE (1 << 8)
-#define GEN6_PIPE_CONTROL_GLOBAL_GTT    (1 << 2)
-#define GEN6_PIPE_CONTROL_LOCAL_PGTT    (0 << 2)
-#define GEN6_PIPE_CONTROL_DEPTH_CACHE_FLUSH	(1 << 0)
-
-/* 3DPRIMITIVE bits */
-#define GEN6_3DPRIMITIVE_VERTEX_SEQUENTIAL (0 << 15)
-#define GEN6_3DPRIMITIVE_VERTEX_RANDOM	  (1 << 15)
-/* Primitive types are in gen6_defines.h */
-#define GEN6_3DPRIMITIVE_TOPOLOGY_SHIFT	  10
-
-#define GEN6_SVG_CTL		       0x7400
-
-#define GEN6_SVG_CTL_GS_BA	       (0 << 8)
-#define GEN6_SVG_CTL_SS_BA	       (1 << 8)
-#define GEN6_SVG_CTL_IO_BA	       (2 << 8)
-#define GEN6_SVG_CTL_GS_AUB	       (3 << 8)
-#define GEN6_SVG_CTL_IO_AUB	       (4 << 8)
-#define GEN6_SVG_CTL_SIP		       (5 << 8)
-
-#define GEN6_SVG_RDATA		       0x7404
-#define GEN6_SVG_WORK_CTL	       0x7408
-
-#define GEN6_VF_CTL		       0x7500
-
-#define GEN6_VF_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
-#define GEN6_VF_CTL_SNAPSHOT_MUX_SELECT_THREADID	   (0 << 8)
-#define GEN6_VF_CTL_SNAPSHOT_MUX_SELECT_VF_DEBUG	   (1 << 8)
-#define GEN6_VF_CTL_SNAPSHOT_TYPE_VERTEX_SEQUENCE   (0 << 4)
-#define GEN6_VF_CTL_SNAPSHOT_TYPE_VERTEX_INDEX	   (1 << 4)
-#define GEN6_VF_CTL_SKIP_INITIAL_PRIMITIVES	   (1 << 3)
-#define GEN6_VF_CTL_MAX_PRIMITIVES_LIMIT_ENABLE	   (1 << 2)
-#define GEN6_VF_CTL_VERTEX_RANGE_LIMIT_ENABLE	   (1 << 1)
-#define GEN6_VF_CTL_SNAPSHOT_ENABLE	     	   (1 << 0)
-
-#define GEN6_VF_STRG_VAL		       0x7504
-#define GEN6_VF_STR_VL_OVR	       0x7508
-#define GEN6_VF_VC_OVR		       0x750c
-#define GEN6_VF_STR_PSKIP	       0x7510
-#define GEN6_VF_MAX_PRIM		       0x7514
-#define GEN6_VF_RDATA		       0x7518
-
-#define GEN6_VS_CTL		       0x7600
-#define GEN6_VS_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
-#define GEN6_VS_CTL_SNAPSHOT_MUX_VERTEX_0	   (0 << 8)
-#define GEN6_VS_CTL_SNAPSHOT_MUX_VERTEX_1	   (1 << 8)
-#define GEN6_VS_CTL_SNAPSHOT_MUX_VALID_COUNT	   (2 << 8)
-#define GEN6_VS_CTL_SNAPSHOT_MUX_VS_KERNEL_POINTER  (3 << 8)
-#define GEN6_VS_CTL_SNAPSHOT_ALL_THREADS		   (1 << 2)
-#define GEN6_VS_CTL_THREAD_SNAPSHOT_ENABLE	   (1 << 1)
-#define GEN6_VS_CTL_SNAPSHOT_ENABLE		   (1 << 0)
-
-#define GEN6_VS_STRG_VAL		       0x7604
-#define GEN6_VS_RDATA		       0x7608
-
-#define GEN6_SF_CTL		       0x7b00
-#define GEN6_SF_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_0_FF_ID	   (0 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_0_REL_COUNT (1 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_1_FF_ID	   (2 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_1_REL_COUNT (3 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_2_FF_ID	   (4 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_2_REL_COUNT (5 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_VERTEX_COUNT	   (6 << 8)
-#define GEN6_SF_CTL_SNAPSHOT_MUX_SF_KERNEL_POINTER  (7 << 8)
-#define GEN6_SF_CTL_MIN_MAX_PRIMITIVE_RANGE_ENABLE  (1 << 4)
-#define GEN6_SF_CTL_DEBUG_CLIP_RECTANGLE_ENABLE	   (1 << 3)
-#define GEN6_SF_CTL_SNAPSHOT_ALL_THREADS		   (1 << 2)
-#define GEN6_SF_CTL_THREAD_SNAPSHOT_ENABLE	   (1 << 1)
-#define GEN6_SF_CTL_SNAPSHOT_ENABLE		   (1 << 0)
-
-#define GEN6_SF_STRG_VAL		       0x7b04
-#define GEN6_SF_RDATA		       0x7b18
-
-#define GEN6_WIZ_CTL		       0x7c00
-#define GEN6_WIZ_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
-#define GEN6_WIZ_CTL_SUBSPAN_INSTANCE_SHIFT	   16
-#define GEN6_WIZ_CTL_SNAPSHOT_MUX_WIZ_KERNEL_POINTER   (0 << 8)
-#define GEN6_WIZ_CTL_SNAPSHOT_MUX_SUBSPAN_INSTANCE     (1 << 8)
-#define GEN6_WIZ_CTL_SNAPSHOT_MUX_PRIMITIVE_SEQUENCE   (2 << 8)
-#define GEN6_WIZ_CTL_SINGLE_SUBSPAN_DISPATCH	      (1 << 6)
-#define GEN6_WIZ_CTL_IGNORE_COLOR_SCOREBOARD_STALLS    (1 << 5)
-#define GEN6_WIZ_CTL_ENABLE_SUBSPAN_INSTANCE_COMPARE   (1 << 4)
-#define GEN6_WIZ_CTL_USE_UPSTREAM_SNAPSHOT_FLAG	      (1 << 3)
-#define GEN6_WIZ_CTL_SNAPSHOT_ALL_THREADS	      (1 << 2)
-#define GEN6_WIZ_CTL_THREAD_SNAPSHOT_ENABLE	      (1 << 1)
-#define GEN6_WIZ_CTL_SNAPSHOT_ENABLE		      (1 << 0)
-
-#define GEN6_WIZ_STRG_VAL			      0x7c04
-#define GEN6_WIZ_RDATA				      0x7c18
-
-#define GEN6_TS_CTL		       0x7e00
-#define GEN6_TS_CTL_SNAPSHOT_COMPLETE		   (1 << 31)
-#define GEN6_TS_CTL_SNAPSHOT_MESSAGE_ERROR	   (0 << 8)
-#define GEN6_TS_CTL_SNAPSHOT_INTERFACE_DESCRIPTOR   (3 << 8)
-#define GEN6_TS_CTL_SNAPSHOT_ALL_CHILD_THREADS	   (1 << 2)
-#define GEN6_TS_CTL_SNAPSHOT_ALL_ROOT_THREADS  	   (1 << 1)
-#define GEN6_TS_CTL_SNAPSHOT_ENABLE		   (1 << 0)
-
-#define GEN6_TS_STRG_VAL		       0x7e04
-#define GEN6_TS_RDATA		       0x7e08
-
-/* TD_CTL on gen6 is 0x7000, to not break stuff which depends on this... */
-#ifndef GEN6_TD_CTL
-#define GEN6_TD_CTL                   0x8000
-#endif
-#define GEN6_TD_CTL_MUX_SHIFT	       8
-#define GEN6_TD_CTL_EXTERNAL_HALT_R0_DEBUG_MATCH	   (1 << 7)
-#define GEN6_TD_CTL_FORCE_EXTERNAL_HALT		   (1 << 6)
-#define GEN6_TD_CTL_EXCEPTION_MASK_OVERRIDE	   (1 << 5)
-#define GEN6_TD_CTL_FORCE_THREAD_BREAKPOINT_ENABLE  (1 << 4)
-#define GEN6_TD_CTL_BREAKPOINT_ENABLE		   (1 << 2)
-#define GEN6_TD_CTL2		       0x8004
-#define GEN6_TD_CTL2_ILLEGAL_OPCODE_EXCEPTION_OVERRIDE (1 << 28)
-#define GEN6_TD_CTL2_MASKSTACK_EXCEPTION_OVERRIDE      (1 << 26)
-#define GEN6_TD_CTL2_SOFTWARE_EXCEPTION_OVERRIDE	      (1 << 25)
-#define GEN6_TD_CTL2_ACTIVE_THREAD_LIMIT_SHIFT	      16
-#define GEN6_TD_CTL2_ACTIVE_THREAD_LIMIT_ENABLE	      (1 << 8)
-#define GEN6_TD_CTL2_THREAD_SPAWNER_EXECUTION_MASK_ENABLE (1 << 7)
-#define GEN6_TD_CTL2_WIZ_EXECUTION_MASK_ENABLE	      (1 << 6)
-#define GEN6_TD_CTL2_SF_EXECUTION_MASK_ENABLE	      (1 << 5)
-#define GEN6_TD_CTL2_CLIPPER_EXECUTION_MASK_ENABLE     (1 << 4)
-#define GEN6_TD_CTL2_GS_EXECUTION_MASK_ENABLE	      (1 << 3)
-#define GEN6_TD_CTL2_VS_EXECUTION_MASK_ENABLE	      (1 << 0)
-#define GEN6_TD_VF_VS_EMSK	       0x8008
-#define GEN6_TD_GS_EMSK		       0x800c
-#define GEN6_TD_CLIP_EMSK	       0x8010
-#define GEN6_TD_SF_EMSK		       0x8014
-#define GEN6_TD_WIZ_EMSK		       0x8018
-#define GEN6_TD_0_6_EHTRG_VAL	       0x801c
-#define GEN6_TD_0_7_EHTRG_VAL	       0x8020
-#define GEN6_TD_0_6_EHTRG_MSK           0x8024
-#define GEN6_TD_0_7_EHTRG_MSK	       0x8028
-#define GEN6_TD_RDATA		       0x802c
-#define GEN6_TD_TS_EMSK		       0x8030
-
-#define GEN6_EU_CTL		       0x8800
-#define GEN6_EU_CTL_SELECT_SHIFT	       16
-#define GEN6_EU_CTL_DATA_MUX_SHIFT      8
-#define GEN6_EU_ATT_0		       0x8810
-#define GEN6_EU_ATT_1		       0x8814
-#define GEN6_EU_ATT_DATA_0	       0x8820
-#define GEN6_EU_ATT_DATA_1	       0x8824
-#define GEN6_EU_ATT_CLR_0	       0x8830
-#define GEN6_EU_ATT_CLR_1	       0x8834
-#define GEN6_EU_RDATA		       0x8840
-
-/* 3D state:
- */
-#define _3DOP_3DSTATE_PIPELINED       0x0
-#define _3DOP_3DSTATE_NONPIPELINED    0x1
-#define _3DOP_3DCONTROL               0x2
-#define _3DOP_3DPRIMITIVE             0x3
-
-#define _3DSTATE_PIPELINED_POINTERS       0x00
-#define _3DSTATE_BINDING_TABLE_POINTERS   0x01
-#define _3DSTATE_VERTEX_BUFFERS           0x08
-#define _3DSTATE_VERTEX_ELEMENTS          0x09
-#define _3DSTATE_INDEX_BUFFER             0x0A
-#define _3DSTATE_VF_STATISTICS            0x0B
-#define _3DSTATE_DRAWING_RECTANGLE            0x00
-#define _3DSTATE_CONSTANT_COLOR               0x01
-#define _3DSTATE_SAMPLER_PALETTE_LOAD         0x02
-#define _3DSTATE_CHROMA_KEY                   0x04
-#define _3DSTATE_DEPTH_BUFFER                 0x05
-#define _3DSTATE_POLY_STIPPLE_OFFSET          0x06
-#define _3DSTATE_POLY_STIPPLE_PATTERN         0x07
-#define _3DSTATE_LINE_STIPPLE                 0x08
-#define _3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP    0x09
-#define _3DCONTROL    0x00
-#define _3DPRIMITIVE  0x00
-
-#define _3DPRIM_POINTLIST         0x01
-#define _3DPRIM_LINELIST          0x02
-#define _3DPRIM_LINESTRIP         0x03
-#define _3DPRIM_TRILIST           0x04
-#define _3DPRIM_TRISTRIP          0x05
-#define _3DPRIM_TRIFAN            0x06
-#define _3DPRIM_QUADLIST          0x07
-#define _3DPRIM_QUADSTRIP         0x08
-#define _3DPRIM_LINELIST_ADJ      0x09
-#define _3DPRIM_LINESTRIP_ADJ     0x0A
-#define _3DPRIM_TRILIST_ADJ       0x0B
-#define _3DPRIM_TRISTRIP_ADJ      0x0C
-#define _3DPRIM_TRISTRIP_REVERSE  0x0D
-#define _3DPRIM_POLYGON           0x0E
-#define _3DPRIM_RECTLIST          0x0F
-#define _3DPRIM_LINELOOP          0x10
-#define _3DPRIM_POINTLIST_BF      0x11
-#define _3DPRIM_LINESTRIP_CONT    0x12
-#define _3DPRIM_LINESTRIP_BF      0x13
-#define _3DPRIM_LINESTRIP_CONT_BF 0x14
-#define _3DPRIM_TRIFAN_NOSTIPPLE  0x15
-
-#define _3DPRIM_VERTEXBUFFER_ACCESS_SEQUENTIAL 0
-#define _3DPRIM_VERTEXBUFFER_ACCESS_RANDOM     1
-
-#define GEN6_ANISORATIO_2     0 
-#define GEN6_ANISORATIO_4     1 
-#define GEN6_ANISORATIO_6     2 
-#define GEN6_ANISORATIO_8     3 
-#define GEN6_ANISORATIO_10    4 
-#define GEN6_ANISORATIO_12    5 
-#define GEN6_ANISORATIO_14    6 
-#define GEN6_ANISORATIO_16    7
-
-#define GEN6_BLENDFACTOR_ONE                 0x1
-#define GEN6_BLENDFACTOR_SRC_COLOR           0x2
-#define GEN6_BLENDFACTOR_SRC_ALPHA           0x3
-#define GEN6_BLENDFACTOR_DST_ALPHA           0x4
-#define GEN6_BLENDFACTOR_DST_COLOR           0x5
-#define GEN6_BLENDFACTOR_SRC_ALPHA_SATURATE  0x6
-#define GEN6_BLENDFACTOR_CONST_COLOR         0x7
-#define GEN6_BLENDFACTOR_CONST_ALPHA         0x8
-#define GEN6_BLENDFACTOR_SRC1_COLOR          0x9
-#define GEN6_BLENDFACTOR_SRC1_ALPHA          0x0A
-#define GEN6_BLENDFACTOR_ZERO                0x11
-#define GEN6_BLENDFACTOR_INV_SRC_COLOR       0x12
-#define GEN6_BLENDFACTOR_INV_SRC_ALPHA       0x13
-#define GEN6_BLENDFACTOR_INV_DST_ALPHA       0x14
-#define GEN6_BLENDFACTOR_INV_DST_COLOR       0x15
-#define GEN6_BLENDFACTOR_INV_CONST_COLOR     0x17
-#define GEN6_BLENDFACTOR_INV_CONST_ALPHA     0x18
-#define GEN6_BLENDFACTOR_INV_SRC1_COLOR      0x19
-#define GEN6_BLENDFACTOR_INV_SRC1_ALPHA      0x1A
-
-#define GEN6_BLENDFUNCTION_ADD               0
-#define GEN6_BLENDFUNCTION_SUBTRACT          1
-#define GEN6_BLENDFUNCTION_REVERSE_SUBTRACT  2
-#define GEN6_BLENDFUNCTION_MIN               3
-#define GEN6_BLENDFUNCTION_MAX               4
-
-#define GEN6_ALPHATEST_FORMAT_UNORM8         0
-#define GEN6_ALPHATEST_FORMAT_FLOAT32        1
-
-#define GEN6_CHROMAKEY_KILL_ON_ANY_MATCH  0
-#define GEN6_CHROMAKEY_REPLACE_BLACK      1
-
-#define GEN6_CLIP_API_OGL     0
-#define GEN6_CLIP_API_DX      1
-
-#define GEN6_CLIPMODE_NORMAL              0
-#define GEN6_CLIPMODE_CLIP_ALL            1
-#define GEN6_CLIPMODE_CLIP_NON_REJECTED   2
-#define GEN6_CLIPMODE_REJECT_ALL          3
-#define GEN6_CLIPMODE_ACCEPT_ALL          4
-
-#define GEN6_CLIP_NDCSPACE     0
-#define GEN6_CLIP_SCREENSPACE  1
-
-#define GEN6_COMPAREFUNCTION_ALWAYS       0
-#define GEN6_COMPAREFUNCTION_NEVER        1
-#define GEN6_COMPAREFUNCTION_LESS         2
-#define GEN6_COMPAREFUNCTION_EQUAL        3
-#define GEN6_COMPAREFUNCTION_LEQUAL       4
-#define GEN6_COMPAREFUNCTION_GREATER      5
-#define GEN6_COMPAREFUNCTION_NOTEQUAL     6
-#define GEN6_COMPAREFUNCTION_GEQUAL       7
-
-#define GEN6_COVERAGE_PIXELS_HALF     0
-#define GEN6_COVERAGE_PIXELS_1        1
-#define GEN6_COVERAGE_PIXELS_2        2
-#define GEN6_COVERAGE_PIXELS_4        3
-
-#define GEN6_CULLMODE_BOTH        0
-#define GEN6_CULLMODE_NONE        1
-#define GEN6_CULLMODE_FRONT       2
-#define GEN6_CULLMODE_BACK        3
-
-#define GEN6_DEFAULTCOLOR_R8G8B8A8_UNORM      0
-#define GEN6_DEFAULTCOLOR_R32G32B32A32_FLOAT  1
-
-#define GEN6_DEPTHFORMAT_D32_FLOAT_S8X24_UINT     0
-#define GEN6_DEPTHFORMAT_D32_FLOAT                1
-#define GEN6_DEPTHFORMAT_D24_UNORM_S8_UINT        2
-#define GEN6_DEPTHFORMAT_D16_UNORM                5
-
-#define GEN6_FLOATING_POINT_IEEE_754        0
-#define GEN6_FLOATING_POINT_NON_IEEE_754    1
-
-#define GEN6_FRONTWINDING_CW      0
-#define GEN6_FRONTWINDING_CCW     1
-
-#define GEN6_INDEX_BYTE     0
-#define GEN6_INDEX_WORD     1
-#define GEN6_INDEX_DWORD    2
-
-#define GEN6_LOGICOPFUNCTION_CLEAR            0
-#define GEN6_LOGICOPFUNCTION_NOR              1
-#define GEN6_LOGICOPFUNCTION_AND_INVERTED     2
-#define GEN6_LOGICOPFUNCTION_COPY_INVERTED    3
-#define GEN6_LOGICOPFUNCTION_AND_REVERSE      4
-#define GEN6_LOGICOPFUNCTION_INVERT           5
-#define GEN6_LOGICOPFUNCTION_XOR              6
-#define GEN6_LOGICOPFUNCTION_NAND             7
-#define GEN6_LOGICOPFUNCTION_AND              8
-#define GEN6_LOGICOPFUNCTION_EQUIV            9
-#define GEN6_LOGICOPFUNCTION_NOOP             10
-#define GEN6_LOGICOPFUNCTION_OR_INVERTED      11
-#define GEN6_LOGICOPFUNCTION_COPY             12
-#define GEN6_LOGICOPFUNCTION_OR_REVERSE       13
-#define GEN6_LOGICOPFUNCTION_OR               14
-#define GEN6_LOGICOPFUNCTION_SET              15  
-
-#define GEN6_MAPFILTER_NEAREST        0x0 
-#define GEN6_MAPFILTER_LINEAR         0x1 
-#define GEN6_MAPFILTER_ANISOTROPIC    0x2
-
-#define GEN6_MIPFILTER_NONE        0   
-#define GEN6_MIPFILTER_NEAREST     1   
-#define GEN6_MIPFILTER_LINEAR      3
-
-#define GEN6_POLYGON_FRONT_FACING     0
-#define GEN6_POLYGON_BACK_FACING      1
-
-#define GEN6_PREFILTER_ALWAYS     0x0 
-#define GEN6_PREFILTER_NEVER      0x1
-#define GEN6_PREFILTER_LESS       0x2
-#define GEN6_PREFILTER_EQUAL      0x3
-#define GEN6_PREFILTER_LEQUAL     0x4
-#define GEN6_PREFILTER_GREATER    0x5
-#define GEN6_PREFILTER_NOTEQUAL   0x6
-#define GEN6_PREFILTER_GEQUAL     0x7
-
-#define GEN6_PROVOKING_VERTEX_0    0
-#define GEN6_PROVOKING_VERTEX_1    1 
-#define GEN6_PROVOKING_VERTEX_2    2
-
-#define GEN6_RASTRULE_UPPER_LEFT  0    
-#define GEN6_RASTRULE_UPPER_RIGHT 1
-
-#define GEN6_RENDERTARGET_CLAMPRANGE_UNORM    0
-#define GEN6_RENDERTARGET_CLAMPRANGE_SNORM    1
-#define GEN6_RENDERTARGET_CLAMPRANGE_FORMAT   2
-
-#define GEN6_STENCILOP_KEEP               0
-#define GEN6_STENCILOP_ZERO               1
-#define GEN6_STENCILOP_REPLACE            2
-#define GEN6_STENCILOP_INCRSAT            3
-#define GEN6_STENCILOP_DECRSAT            4
-#define GEN6_STENCILOP_INCR               5
-#define GEN6_STENCILOP_DECR               6
-#define GEN6_STENCILOP_INVERT             7
-
-#define GEN6_SURFACE_MIPMAPLAYOUT_BELOW   0
-#define GEN6_SURFACE_MIPMAPLAYOUT_RIGHT   1
-
-#define GEN6_SURFACEFORMAT_R32G32B32A32_FLOAT             0x000
-#define GEN6_SURFACEFORMAT_R32G32B32A32_SINT              0x001
-#define GEN6_SURFACEFORMAT_R32G32B32A32_UINT              0x002
-#define GEN6_SURFACEFORMAT_R32G32B32A32_UNORM             0x003
-#define GEN6_SURFACEFORMAT_R32G32B32A32_SNORM             0x004
-#define GEN6_SURFACEFORMAT_R64G64_FLOAT                   0x005
-#define GEN6_SURFACEFORMAT_R32G32B32X32_FLOAT             0x006
-#define GEN6_SURFACEFORMAT_R32G32B32A32_SSCALED           0x007
-#define GEN6_SURFACEFORMAT_R32G32B32A32_USCALED           0x008
-#define GEN6_SURFACEFORMAT_R32G32B32_FLOAT                0x040
-#define GEN6_SURFACEFORMAT_R32G32B32_SINT                 0x041
-#define GEN6_SURFACEFORMAT_R32G32B32_UINT                 0x042
-#define GEN6_SURFACEFORMAT_R32G32B32_UNORM                0x043
-#define GEN6_SURFACEFORMAT_R32G32B32_SNORM                0x044
-#define GEN6_SURFACEFORMAT_R32G32B32_SSCALED              0x045
-#define GEN6_SURFACEFORMAT_R32G32B32_USCALED              0x046
-#define GEN6_SURFACEFORMAT_R16G16B16A16_UNORM             0x080
-#define GEN6_SURFACEFORMAT_R16G16B16A16_SNORM             0x081
-#define GEN6_SURFACEFORMAT_R16G16B16A16_SINT              0x082
-#define GEN6_SURFACEFORMAT_R16G16B16A16_UINT              0x083
-#define GEN6_SURFACEFORMAT_R16G16B16A16_FLOAT             0x084
-#define GEN6_SURFACEFORMAT_R32G32_FLOAT                   0x085
-#define GEN6_SURFACEFORMAT_R32G32_SINT                    0x086
-#define GEN6_SURFACEFORMAT_R32G32_UINT                    0x087
-#define GEN6_SURFACEFORMAT_R32_FLOAT_X8X24_TYPELESS       0x088
-#define GEN6_SURFACEFORMAT_X32_TYPELESS_G8X24_UINT        0x089
-#define GEN6_SURFACEFORMAT_L32A32_FLOAT                   0x08A
-#define GEN6_SURFACEFORMAT_R32G32_UNORM                   0x08B
-#define GEN6_SURFACEFORMAT_R32G32_SNORM                   0x08C
-#define GEN6_SURFACEFORMAT_R64_FLOAT                      0x08D
-#define GEN6_SURFACEFORMAT_R16G16B16X16_UNORM             0x08E
-#define GEN6_SURFACEFORMAT_R16G16B16X16_FLOAT             0x08F
-#define GEN6_SURFACEFORMAT_A32X32_FLOAT                   0x090
-#define GEN6_SURFACEFORMAT_L32X32_FLOAT                   0x091
-#define GEN6_SURFACEFORMAT_I32X32_FLOAT                   0x092
-#define GEN6_SURFACEFORMAT_R16G16B16A16_SSCALED           0x093
-#define GEN6_SURFACEFORMAT_R16G16B16A16_USCALED           0x094
-#define GEN6_SURFACEFORMAT_R32G32_SSCALED                 0x095
-#define GEN6_SURFACEFORMAT_R32G32_USCALED                 0x096
-#define GEN6_SURFACEFORMAT_B8G8R8A8_UNORM                 0x0C0
-#define GEN6_SURFACEFORMAT_B8G8R8A8_UNORM_SRGB            0x0C1
-#define GEN6_SURFACEFORMAT_R10G10B10A2_UNORM              0x0C2
-#define GEN6_SURFACEFORMAT_R10G10B10A2_UNORM_SRGB         0x0C3
-#define GEN6_SURFACEFORMAT_R10G10B10A2_UINT               0x0C4
-#define GEN6_SURFACEFORMAT_R10G10B10_SNORM_A2_UNORM       0x0C5
-#define GEN6_SURFACEFORMAT_R8G8B8A8_UNORM                 0x0C7
-#define GEN6_SURFACEFORMAT_R8G8B8A8_UNORM_SRGB            0x0C8
-#define GEN6_SURFACEFORMAT_R8G8B8A8_SNORM                 0x0C9
-#define GEN6_SURFACEFORMAT_R8G8B8A8_SINT                  0x0CA
-#define GEN6_SURFACEFORMAT_R8G8B8A8_UINT                  0x0CB
-#define GEN6_SURFACEFORMAT_R16G16_UNORM                   0x0CC
-#define GEN6_SURFACEFORMAT_R16G16_SNORM                   0x0CD
-#define GEN6_SURFACEFORMAT_R16G16_SINT                    0x0CE
-#define GEN6_SURFACEFORMAT_R16G16_UINT                    0x0CF
-#define GEN6_SURFACEFORMAT_R16G16_FLOAT                   0x0D0
-#define GEN6_SURFACEFORMAT_B10G10R10A2_UNORM              0x0D1
-#define GEN6_SURFACEFORMAT_B10G10R10A2_UNORM_SRGB         0x0D2
-#define GEN6_SURFACEFORMAT_R11G11B10_FLOAT                0x0D3
-#define GEN6_SURFACEFORMAT_R32_SINT                       0x0D6
-#define GEN6_SURFACEFORMAT_R32_UINT                       0x0D7
-#define GEN6_SURFACEFORMAT_R32_FLOAT                      0x0D8
-#define GEN6_SURFACEFORMAT_R24_UNORM_X8_TYPELESS          0x0D9
-#define GEN6_SURFACEFORMAT_X24_TYPELESS_G8_UINT           0x0DA
-#define GEN6_SURFACEFORMAT_L16A16_UNORM                   0x0DF
-#define GEN6_SURFACEFORMAT_I24X8_UNORM                    0x0E0
-#define GEN6_SURFACEFORMAT_L24X8_UNORM                    0x0E1
-#define GEN6_SURFACEFORMAT_A24X8_UNORM                    0x0E2
-#define GEN6_SURFACEFORMAT_I32_FLOAT                      0x0E3
-#define GEN6_SURFACEFORMAT_L32_FLOAT                      0x0E4
-#define GEN6_SURFACEFORMAT_A32_FLOAT                      0x0E5
-#define GEN6_SURFACEFORMAT_B8G8R8X8_UNORM                 0x0E9
-#define GEN6_SURFACEFORMAT_B8G8R8X8_UNORM_SRGB            0x0EA
-#define GEN6_SURFACEFORMAT_R8G8B8X8_UNORM                 0x0EB
-#define GEN6_SURFACEFORMAT_R8G8B8X8_UNORM_SRGB            0x0EC
-#define GEN6_SURFACEFORMAT_R9G9B9E5_SHAREDEXP             0x0ED
-#define GEN6_SURFACEFORMAT_B10G10R10X2_UNORM              0x0EE
-#define GEN6_SURFACEFORMAT_L16A16_FLOAT                   0x0F0
-#define GEN6_SURFACEFORMAT_R32_UNORM                      0x0F1
-#define GEN6_SURFACEFORMAT_R32_SNORM                      0x0F2
-#define GEN6_SURFACEFORMAT_R10G10B10X2_USCALED            0x0F3
-#define GEN6_SURFACEFORMAT_R8G8B8A8_SSCALED               0x0F4
-#define GEN6_SURFACEFORMAT_R8G8B8A8_USCALED               0x0F5
-#define GEN6_SURFACEFORMAT_R16G16_SSCALED                 0x0F6
-#define GEN6_SURFACEFORMAT_R16G16_USCALED                 0x0F7
-#define GEN6_SURFACEFORMAT_R32_SSCALED                    0x0F8
-#define GEN6_SURFACEFORMAT_R32_USCALED                    0x0F9
-#define GEN6_SURFACEFORMAT_B5G6R5_UNORM                   0x100
-#define GEN6_SURFACEFORMAT_B5G6R5_UNORM_SRGB              0x101
-#define GEN6_SURFACEFORMAT_B5G5R5A1_UNORM                 0x102
-#define GEN6_SURFACEFORMAT_B5G5R5A1_UNORM_SRGB            0x103
-#define GEN6_SURFACEFORMAT_B4G4R4A4_UNORM                 0x104
-#define GEN6_SURFACEFORMAT_B4G4R4A4_UNORM_SRGB            0x105
-#define GEN6_SURFACEFORMAT_R8G8_UNORM                     0x106
-#define GEN6_SURFACEFORMAT_R8G8_SNORM                     0x107
-#define GEN6_SURFACEFORMAT_R8G8_SINT                      0x108
-#define GEN6_SURFACEFORMAT_R8G8_UINT                      0x109
-#define GEN6_SURFACEFORMAT_R16_UNORM                      0x10A
-#define GEN6_SURFACEFORMAT_R16_SNORM                      0x10B
-#define GEN6_SURFACEFORMAT_R16_SINT                       0x10C
-#define GEN6_SURFACEFORMAT_R16_UINT                       0x10D
-#define GEN6_SURFACEFORMAT_R16_FLOAT                      0x10E
-#define GEN6_SURFACEFORMAT_I16_UNORM                      0x111
-#define GEN6_SURFACEFORMAT_L16_UNORM                      0x112
-#define GEN6_SURFACEFORMAT_A16_UNORM                      0x113
-#define GEN6_SURFACEFORMAT_L8A8_UNORM                     0x114
-#define GEN6_SURFACEFORMAT_I16_FLOAT                      0x115
-#define GEN6_SURFACEFORMAT_L16_FLOAT                      0x116
-#define GEN6_SURFACEFORMAT_A16_FLOAT                      0x117
-#define GEN6_SURFACEFORMAT_R5G5_SNORM_B6_UNORM            0x119
-#define GEN6_SURFACEFORMAT_B5G5R5X1_UNORM                 0x11A
-#define GEN6_SURFACEFORMAT_B5G5R5X1_UNORM_SRGB            0x11B
-#define GEN6_SURFACEFORMAT_R8G8_SSCALED                   0x11C
-#define GEN6_SURFACEFORMAT_R8G8_USCALED                   0x11D
-#define GEN6_SURFACEFORMAT_R16_SSCALED                    0x11E
-#define GEN6_SURFACEFORMAT_R16_USCALED                    0x11F
-#define GEN6_SURFACEFORMAT_R8_UNORM                       0x140
-#define GEN6_SURFACEFORMAT_R8_SNORM                       0x141
-#define GEN6_SURFACEFORMAT_R8_SINT                        0x142
-#define GEN6_SURFACEFORMAT_R8_UINT                        0x143
-#define GEN6_SURFACEFORMAT_A8_UNORM                       0x144
-#define GEN6_SURFACEFORMAT_I8_UNORM                       0x145
-#define GEN6_SURFACEFORMAT_L8_UNORM                       0x146
-#define GEN6_SURFACEFORMAT_P4A4_UNORM                     0x147
-#define GEN6_SURFACEFORMAT_A4P4_UNORM                     0x148
-#define GEN6_SURFACEFORMAT_R8_SSCALED                     0x149
-#define GEN6_SURFACEFORMAT_R8_USCALED                     0x14A
-#define GEN6_SURFACEFORMAT_R1_UINT                        0x181
-#define GEN6_SURFACEFORMAT_YCRCB_NORMAL                   0x182
-#define GEN6_SURFACEFORMAT_YCRCB_SWAPUVY                  0x183
-#define GEN6_SURFACEFORMAT_BC1_UNORM                      0x186
-#define GEN6_SURFACEFORMAT_BC2_UNORM                      0x187
-#define GEN6_SURFACEFORMAT_BC3_UNORM                      0x188
-#define GEN6_SURFACEFORMAT_BC4_UNORM                      0x189
-#define GEN6_SURFACEFORMAT_BC5_UNORM                      0x18A
-#define GEN6_SURFACEFORMAT_BC1_UNORM_SRGB                 0x18B
-#define GEN6_SURFACEFORMAT_BC2_UNORM_SRGB                 0x18C
-#define GEN6_SURFACEFORMAT_BC3_UNORM_SRGB                 0x18D
-#define GEN6_SURFACEFORMAT_MONO8                          0x18E
-#define GEN6_SURFACEFORMAT_YCRCB_SWAPUV                   0x18F
-#define GEN6_SURFACEFORMAT_YCRCB_SWAPY                    0x190
-#define GEN6_SURFACEFORMAT_DXT1_RGB                       0x191
-#define GEN6_SURFACEFORMAT_FXT1                           0x192
-#define GEN6_SURFACEFORMAT_R8G8B8_UNORM                   0x193
-#define GEN6_SURFACEFORMAT_R8G8B8_SNORM                   0x194
-#define GEN6_SURFACEFORMAT_R8G8B8_SSCALED                 0x195
-#define GEN6_SURFACEFORMAT_R8G8B8_USCALED                 0x196
-#define GEN6_SURFACEFORMAT_R64G64B64A64_FLOAT             0x197
-#define GEN6_SURFACEFORMAT_R64G64B64_FLOAT                0x198
-#define GEN6_SURFACEFORMAT_BC4_SNORM                      0x199
-#define GEN6_SURFACEFORMAT_BC5_SNORM                      0x19A
-#define GEN6_SURFACEFORMAT_R16G16B16_UNORM                0x19C
-#define GEN6_SURFACEFORMAT_R16G16B16_SNORM                0x19D
-#define GEN6_SURFACEFORMAT_R16G16B16_SSCALED              0x19E
-#define GEN6_SURFACEFORMAT_R16G16B16_USCALED              0x19F
-
-#define GEN6_SURFACERETURNFORMAT_FLOAT32  0
-#define GEN6_SURFACERETURNFORMAT_S1       1
-
-#define GEN6_SURFACE_1D      0
-#define GEN6_SURFACE_2D      1
-#define GEN6_SURFACE_3D      2
-#define GEN6_SURFACE_CUBE    3
-#define GEN6_SURFACE_BUFFER  4
-#define GEN6_SURFACE_NULL    7
-
-#define GEN6_BORDER_COLOR_MODE_DEFAULT	0
-#define GEN6_BORDER_COLOR_MODE_LEGACY	1
-
-#define GEN6_TEXCOORDMODE_WRAP            0
-#define GEN6_TEXCOORDMODE_MIRROR          1
-#define GEN6_TEXCOORDMODE_CLAMP           2
-#define GEN6_TEXCOORDMODE_CUBE            3
-#define GEN6_TEXCOORDMODE_CLAMP_BORDER    4
-#define GEN6_TEXCOORDMODE_MIRROR_ONCE     5
-
-#define GEN6_THREAD_PRIORITY_NORMAL   0
-#define GEN6_THREAD_PRIORITY_HIGH     1
-
-#define GEN6_TILEWALK_XMAJOR                 0
-#define GEN6_TILEWALK_YMAJOR                 1
-
-#define GEN6_VERTEX_SUBPIXEL_PRECISION_8BITS  0
-#define GEN6_VERTEX_SUBPIXEL_PRECISION_4BITS  1
-
-#define GEN6_VERTEXBUFFER_ACCESS_VERTEXDATA     0
-#define GEN6_VERTEXBUFFER_ACCESS_INSTANCEDATA   1
-
-#define GEN6_VFCOMPONENT_NOSTORE      0
-#define GEN6_VFCOMPONENT_STORE_SRC    1
-#define GEN6_VFCOMPONENT_STORE_0      2
-#define GEN6_VFCOMPONENT_STORE_1_FLT  3
-#define GEN6_VFCOMPONENT_STORE_1_INT  4
-#define GEN6_VFCOMPONENT_STORE_VID    5
-#define GEN6_VFCOMPONENT_STORE_IID    6
-#define GEN6_VFCOMPONENT_STORE_PID    7
-
-
-
-/* Execution Unit (EU) defines
- */
-
-#define GEN6_ALIGN_1   0
-#define GEN6_ALIGN_16  1
-
-#define GEN6_ADDRESS_DIRECT                        0
-#define GEN6_ADDRESS_REGISTER_INDIRECT_REGISTER    1
-
-#define GEN6_CHANNEL_X     0
-#define GEN6_CHANNEL_Y     1
-#define GEN6_CHANNEL_Z     2
-#define GEN6_CHANNEL_W     3
-
-#define GEN6_COMPRESSION_NONE          0
-#define GEN6_COMPRESSION_2NDHALF       1
-#define GEN6_COMPRESSION_COMPRESSED    2
-
-#define GEN6_CONDITIONAL_NONE  0
-#define GEN6_CONDITIONAL_Z     1
-#define GEN6_CONDITIONAL_NZ    2
-#define GEN6_CONDITIONAL_EQ    1	/* Z */
-#define GEN6_CONDITIONAL_NEQ   2	/* NZ */
-#define GEN6_CONDITIONAL_G     3
-#define GEN6_CONDITIONAL_GE    4
-#define GEN6_CONDITIONAL_L     5
-#define GEN6_CONDITIONAL_LE    6
-#define GEN6_CONDITIONAL_C     7
-#define GEN6_CONDITIONAL_O     8
-
-#define GEN6_DEBUG_NONE        0
-#define GEN6_DEBUG_BREAKPOINT  1
-
-#define GEN6_DEPENDENCY_NORMAL         0
-#define GEN6_DEPENDENCY_NOTCLEARED     1
-#define GEN6_DEPENDENCY_NOTCHECKED     2
-#define GEN6_DEPENDENCY_DISABLE        3
-
-#define GEN6_EXECUTE_1     0
-#define GEN6_EXECUTE_2     1
-#define GEN6_EXECUTE_4     2
-#define GEN6_EXECUTE_8     3
-#define GEN6_EXECUTE_16    4
-#define GEN6_EXECUTE_32    5
-
-#define GEN6_HORIZONTAL_STRIDE_0   0
-#define GEN6_HORIZONTAL_STRIDE_1   1
-#define GEN6_HORIZONTAL_STRIDE_2   2
-#define GEN6_HORIZONTAL_STRIDE_4   3
-
-#define GEN6_INSTRUCTION_NORMAL    0
-#define GEN6_INSTRUCTION_SATURATE  1
-
-#define GEN6_MASK_ENABLE   0
-#define GEN6_MASK_DISABLE  1
-
-#define GEN6_OPCODE_MOV        1
-#define GEN6_OPCODE_SEL        2
-#define GEN6_OPCODE_NOT        4
-#define GEN6_OPCODE_AND        5
-#define GEN6_OPCODE_OR         6
-#define GEN6_OPCODE_XOR        7
-#define GEN6_OPCODE_SHR        8
-#define GEN6_OPCODE_SHL        9
-#define GEN6_OPCODE_RSR        10
-#define GEN6_OPCODE_RSL        11
-#define GEN6_OPCODE_ASR        12
-#define GEN6_OPCODE_CMP        16
-#define GEN6_OPCODE_JMPI       32
-#define GEN6_OPCODE_IF         34
-#define GEN6_OPCODE_IFF        35
-#define GEN6_OPCODE_ELSE       36
-#define GEN6_OPCODE_ENDIF      37
-#define GEN6_OPCODE_DO         38
-#define GEN6_OPCODE_WHILE      39
-#define GEN6_OPCODE_BREAK      40
-#define GEN6_OPCODE_CONTINUE   41
-#define GEN6_OPCODE_HALT       42
-#define GEN6_OPCODE_MSAVE      44
-#define GEN6_OPCODE_MRESTORE   45
-#define GEN6_OPCODE_PUSH       46
-#define GEN6_OPCODE_POP        47
-#define GEN6_OPCODE_WAIT       48
-#define GEN6_OPCODE_SEND       49
-#define GEN6_OPCODE_ADD        64
-#define GEN6_OPCODE_MUL        65
-#define GEN6_OPCODE_AVG        66
-#define GEN6_OPCODE_FRC        67
-#define GEN6_OPCODE_RNDU       68
-#define GEN6_OPCODE_RNDD       69
-#define GEN6_OPCODE_RNDE       70
-#define GEN6_OPCODE_RNDZ       71
-#define GEN6_OPCODE_MAC        72
-#define GEN6_OPCODE_MACH       73
-#define GEN6_OPCODE_LZD        74
-#define GEN6_OPCODE_SAD2       80
-#define GEN6_OPCODE_SADA2      81
-#define GEN6_OPCODE_DP4        84
-#define GEN6_OPCODE_DPH        85
-#define GEN6_OPCODE_DP3        86
-#define GEN6_OPCODE_DP2        87
-#define GEN6_OPCODE_DPA2       88
-#define GEN6_OPCODE_LINE       89
-#define GEN6_OPCODE_NOP        126
-
-#define GEN6_PREDICATE_NONE             0
-#define GEN6_PREDICATE_NORMAL           1
-#define GEN6_PREDICATE_ALIGN1_ANYV             2
-#define GEN6_PREDICATE_ALIGN1_ALLV             3
-#define GEN6_PREDICATE_ALIGN1_ANY2H            4
-#define GEN6_PREDICATE_ALIGN1_ALL2H            5
-#define GEN6_PREDICATE_ALIGN1_ANY4H            6
-#define GEN6_PREDICATE_ALIGN1_ALL4H            7
-#define GEN6_PREDICATE_ALIGN1_ANY8H            8
-#define GEN6_PREDICATE_ALIGN1_ALL8H            9
-#define GEN6_PREDICATE_ALIGN1_ANY16H           10
-#define GEN6_PREDICATE_ALIGN1_ALL16H           11
-#define GEN6_PREDICATE_ALIGN16_REPLICATE_X     2
-#define GEN6_PREDICATE_ALIGN16_REPLICATE_Y     3
-#define GEN6_PREDICATE_ALIGN16_REPLICATE_Z     4
-#define GEN6_PREDICATE_ALIGN16_REPLICATE_W     5
-#define GEN6_PREDICATE_ALIGN16_ANY4H           6
-#define GEN6_PREDICATE_ALIGN16_ALL4H           7
-
-#define GEN6_ARCHITECTURE_REGISTER_FILE    0
-#define GEN6_GENERAL_REGISTER_FILE         1
-#define GEN6_MESSAGE_REGISTER_FILE         2
-#define GEN6_IMMEDIATE_VALUE               3
-
-#define GEN6_REGISTER_TYPE_UD  0
-#define GEN6_REGISTER_TYPE_D   1
-#define GEN6_REGISTER_TYPE_UW  2
-#define GEN6_REGISTER_TYPE_W   3
-#define GEN6_REGISTER_TYPE_UB  4
-#define GEN6_REGISTER_TYPE_B   5
-#define GEN6_REGISTER_TYPE_VF  5	/* packed float vector, immediates only? */
-#define GEN6_REGISTER_TYPE_HF  6
-#define GEN6_REGISTER_TYPE_V   6	/* packed int vector, immediates only, uword dest only */
-#define GEN6_REGISTER_TYPE_F   7
-
-#define GEN6_ARF_NULL                  0x00
-#define GEN6_ARF_ADDRESS               0x10
-#define GEN6_ARF_ACCUMULATOR           0x20   
-#define GEN6_ARF_FLAG                  0x30
-#define GEN6_ARF_MASK                  0x40
-#define GEN6_ARF_MASK_STACK            0x50
-#define GEN6_ARF_MASK_STACK_DEPTH      0x60
-#define GEN6_ARF_STATE                 0x70
-#define GEN6_ARF_CONTROL               0x80
-#define GEN6_ARF_NOTIFICATION_COUNT    0x90
-#define GEN6_ARF_IP                    0xA0
-
-#define GEN6_AMASK   0
-#define GEN6_IMASK   1
-#define GEN6_LMASK   2
-#define GEN6_CMASK   3
-
-
-
-#define GEN6_THREAD_NORMAL     0
-#define GEN6_THREAD_ATOMIC     1
-#define GEN6_THREAD_SWITCH     2
-
-#define GEN6_VERTICAL_STRIDE_0                 0
-#define GEN6_VERTICAL_STRIDE_1                 1
-#define GEN6_VERTICAL_STRIDE_2                 2
-#define GEN6_VERTICAL_STRIDE_4                 3
-#define GEN6_VERTICAL_STRIDE_8                 4
-#define GEN6_VERTICAL_STRIDE_16                5
-#define GEN6_VERTICAL_STRIDE_32                6
-#define GEN6_VERTICAL_STRIDE_64                7
-#define GEN6_VERTICAL_STRIDE_128               8
-#define GEN6_VERTICAL_STRIDE_256               9
-#define GEN6_VERTICAL_STRIDE_ONE_DIMENSIONAL   0xF
-
-#define GEN6_WIDTH_1       0
-#define GEN6_WIDTH_2       1
-#define GEN6_WIDTH_4       2
-#define GEN6_WIDTH_8       3
-#define GEN6_WIDTH_16      4
-
-#define GEN6_STATELESS_BUFFER_BOUNDARY_1K      0
-#define GEN6_STATELESS_BUFFER_BOUNDARY_2K      1
-#define GEN6_STATELESS_BUFFER_BOUNDARY_4K      2
-#define GEN6_STATELESS_BUFFER_BOUNDARY_8K      3
-#define GEN6_STATELESS_BUFFER_BOUNDARY_16K     4
-#define GEN6_STATELESS_BUFFER_BOUNDARY_32K     5
-#define GEN6_STATELESS_BUFFER_BOUNDARY_64K     6
-#define GEN6_STATELESS_BUFFER_BOUNDARY_128K    7
-#define GEN6_STATELESS_BUFFER_BOUNDARY_256K    8
-#define GEN6_STATELESS_BUFFER_BOUNDARY_512K    9
-#define GEN6_STATELESS_BUFFER_BOUNDARY_1M      10
-#define GEN6_STATELESS_BUFFER_BOUNDARY_2M      11
-
-#define GEN6_POLYGON_FACING_FRONT      0
-#define GEN6_POLYGON_FACING_BACK       1
-
-#define GEN6_MESSAGE_TARGET_NULL               0
-#define GEN6_MESSAGE_TARGET_MATH               1
-#define GEN6_MESSAGE_TARGET_SAMPLER            2
-#define GEN6_MESSAGE_TARGET_GATEWAY            3
-#define GEN6_MESSAGE_TARGET_DATAPORT_READ      4
-#define GEN6_MESSAGE_TARGET_DATAPORT_WRITE     5
-#define GEN6_MESSAGE_TARGET_URB                6
-#define GEN6_MESSAGE_TARGET_THREAD_SPAWNER     7
-
-#define GEN6_SAMPLER_RETURN_FORMAT_FLOAT32     0
-#define GEN6_SAMPLER_RETURN_FORMAT_UINT32      2
-#define GEN6_SAMPLER_RETURN_FORMAT_SINT32      3
-
-#define GEN6_SAMPLER_MESSAGE_SIMD8_SAMPLE              0
-#define GEN6_SAMPLER_MESSAGE_SIMD16_SAMPLE             0
-#define GEN6_SAMPLER_MESSAGE_SIMD16_SAMPLE_BIAS        0
-#define GEN6_SAMPLER_MESSAGE_SIMD8_KILLPIX             1
-#define GEN6_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_LOD        1
-#define GEN6_SAMPLER_MESSAGE_SIMD16_SAMPLE_LOD         1
-#define GEN6_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_GRADIENTS  2
-#define GEN6_SAMPLER_MESSAGE_SIMD8_SAMPLE_GRADIENTS    2
-#define GEN6_SAMPLER_MESSAGE_SIMD4X2_SAMPLE_COMPARE    0
-#define GEN6_SAMPLER_MESSAGE_SIMD16_SAMPLE_COMPARE     2
-#define GEN6_SAMPLER_MESSAGE_SIMD4X2_RESINFO           2
-#define GEN6_SAMPLER_MESSAGE_SIMD8_RESINFO             2
-#define GEN6_SAMPLER_MESSAGE_SIMD16_RESINFO            2
-#define GEN6_SAMPLER_MESSAGE_SIMD4X2_LD                3
-#define GEN6_SAMPLER_MESSAGE_SIMD8_LD                  3
-#define GEN6_SAMPLER_MESSAGE_SIMD16_LD                 3
-
-#define GEN6_DATAPORT_OWORD_BLOCK_1_OWORDLOW   0
-#define GEN6_DATAPORT_OWORD_BLOCK_1_OWORDHIGH  1
-#define GEN6_DATAPORT_OWORD_BLOCK_2_OWORDS     2
-#define GEN6_DATAPORT_OWORD_BLOCK_4_OWORDS     3
-#define GEN6_DATAPORT_OWORD_BLOCK_8_OWORDS     4
-
-#define GEN6_DATAPORT_OWORD_DUAL_BLOCK_1OWORD     0
-#define GEN6_DATAPORT_OWORD_DUAL_BLOCK_4OWORDS    2
-
-#define GEN6_DATAPORT_DWORD_SCATTERED_BLOCK_8DWORDS   2
-#define GEN6_DATAPORT_DWORD_SCATTERED_BLOCK_16DWORDS  3
-
-#define GEN6_DATAPORT_READ_MESSAGE_OWORD_BLOCK_READ          0
-#define GEN6_DATAPORT_READ_MESSAGE_OWORD_DUAL_BLOCK_READ     1
-#define GEN6_DATAPORT_READ_MESSAGE_DWORD_BLOCK_READ          2
-#define GEN6_DATAPORT_READ_MESSAGE_DWORD_SCATTERED_READ      3
-
-#define GEN6_DATAPORT_READ_TARGET_DATA_CACHE      0
-#define GEN6_DATAPORT_READ_TARGET_RENDER_CACHE    1
-#define GEN6_DATAPORT_READ_TARGET_SAMPLER_CACHE   2
-
-#define GEN6_DATAPORT_RENDER_TARGET_WRITE_SIMD16_SINGLE_SOURCE                0
-#define GEN6_DATAPORT_RENDER_TARGET_WRITE_SIMD16_SINGLE_SOURCE_REPLICATED     1
-#define GEN6_DATAPORT_RENDER_TARGET_WRITE_SIMD8_DUAL_SOURCE_SUBSPAN01         2
-#define GEN6_DATAPORT_RENDER_TARGET_WRITE_SIMD8_DUAL_SOURCE_SUBSPAN23         3
-#define GEN6_DATAPORT_RENDER_TARGET_WRITE_SIMD8_SINGLE_SOURCE_SUBSPAN01       4
-
-#define GEN6_DATAPORT_WRITE_MESSAGE_OWORD_BLOCK_WRITE                0
-#define GEN6_DATAPORT_WRITE_MESSAGE_OWORD_DUAL_BLOCK_WRITE           1
-#define GEN6_DATAPORT_WRITE_MESSAGE_DWORD_BLOCK_WRITE                2
-#define GEN6_DATAPORT_WRITE_MESSAGE_DWORD_SCATTERED_WRITE            3
-#define GEN6_DATAPORT_WRITE_MESSAGE_RENDER_TARGET_WRITE              4
-#define GEN6_DATAPORT_WRITE_MESSAGE_STREAMED_VERTEX_BUFFER_WRITE     5
-#define GEN6_DATAPORT_WRITE_MESSAGE_FLUSH_RENDER_CACHE               7
-
-#define GEN6_MATH_FUNCTION_INV                              1
-#define GEN6_MATH_FUNCTION_LOG                              2
-#define GEN6_MATH_FUNCTION_EXP                              3
-#define GEN6_MATH_FUNCTION_SQRT                             4
-#define GEN6_MATH_FUNCTION_RSQ                              5
-#define GEN6_MATH_FUNCTION_SIN                              6 /* was 7 */
-#define GEN6_MATH_FUNCTION_COS                              7 /* was 8 */
-#define GEN6_MATH_FUNCTION_SINCOS                           8 /* was 6 */
-#define GEN6_MATH_FUNCTION_TAN                              9
-#define GEN6_MATH_FUNCTION_POW                              10
-#define GEN6_MATH_FUNCTION_INT_DIV_QUOTIENT_AND_REMAINDER   11
-#define GEN6_MATH_FUNCTION_INT_DIV_QUOTIENT                 12
-#define GEN6_MATH_FUNCTION_INT_DIV_REMAINDER                13
-
-#define GEN6_MATH_INTEGER_UNSIGNED     0
-#define GEN6_MATH_INTEGER_SIGNED       1
-
-#define GEN6_MATH_PRECISION_FULL        0
-#define GEN6_MATH_PRECISION_PARTIAL     1
-
-#define GEN6_MATH_SATURATE_NONE         0
-#define GEN6_MATH_SATURATE_SATURATE     1
-
-#define GEN6_MATH_DATA_VECTOR  0
-#define GEN6_MATH_DATA_SCALAR  1
-
-#define GEN6_URB_OPCODE_WRITE  0
-
-#define GEN6_URB_SWIZZLE_NONE          0
-#define GEN6_URB_SWIZZLE_INTERLEAVE    1
-#define GEN6_URB_SWIZZLE_TRANSPOSE     2
-
-#define GEN6_SCRATCH_SPACE_SIZE_1K     0
-#define GEN6_SCRATCH_SPACE_SIZE_2K     1
-#define GEN6_SCRATCH_SPACE_SIZE_4K     2
-#define GEN6_SCRATCH_SPACE_SIZE_8K     3
-#define GEN6_SCRATCH_SPACE_SIZE_16K    4
-#define GEN6_SCRATCH_SPACE_SIZE_32K    5
-#define GEN6_SCRATCH_SPACE_SIZE_64K    6
-#define GEN6_SCRATCH_SPACE_SIZE_128K   7
-#define GEN6_SCRATCH_SPACE_SIZE_256K   8
-#define GEN6_SCRATCH_SPACE_SIZE_512K   9
-#define GEN6_SCRATCH_SPACE_SIZE_1M     10
-#define GEN6_SCRATCH_SPACE_SIZE_2M     11
-
-/* The hardware supports two different modes for border color. The
- * default (OpenGL) mode uses floating-point color channels, while the
- * legacy mode uses 4 bytes.
- *
- * More significantly, the legacy mode respects the components of the
- * border color for channels not present in the source, (whereas the
- * default mode will ignore the border color's alpha channel and use
- * alpha==1 for an RGB source, for example).
- *
- * The legacy mode matches the semantics specified by the Render
- * extension.
- */
-struct gen6_sampler_default_border_color {
-   float color[4];
-};
-
-struct gen6_sampler_legacy_border_color {
-   uint8_t color[4];
-};
-
-struct gen6_sampler_state {
-   struct {
-      uint32_t shadow_function:3;
-      uint32_t lod_bias:11;
-      uint32_t min_filter:3;
-      uint32_t mag_filter:3;
-      uint32_t mip_filter:2;
-      uint32_t base_level:5;
-      uint32_t pad:1;
-      uint32_t lod_preclamp:1;
-      uint32_t border_color_mode:1;
-      uint32_t pad0:1;
-      uint32_t disable:1;
-   } ss0;
-
-   struct {
-      uint32_t r_wrap_mode:3;
-      uint32_t t_wrap_mode:3;
-      uint32_t s_wrap_mode:3;
-      uint32_t pad:3;
-      uint32_t max_lod:10;
-      uint32_t min_lod:10;
-   } ss1;
-
-   struct {
-      uint32_t border_color;
-   } ss2;
-
-   struct {
-      uint32_t pad:19;
-      uint32_t max_aniso:3;
-      uint32_t chroma_key_mode:1;
-      uint32_t chroma_key_index:2;
-      uint32_t chroma_key_enable:1;
-      uint32_t monochrome_filter_width:3;
-      uint32_t monochrome_filter_height:3;
-   } ss3;
-};
-
-struct gen6_blend_state {
-	struct {
-		uint32_t dest_blend_factor:5;
-		uint32_t source_blend_factor:5;
-		uint32_t pad3:1;
-		uint32_t blend_func:3;
-		uint32_t pad2:1;
-		uint32_t ia_dest_blend_factor:5;
-		uint32_t ia_source_blend_factor:5;
-		uint32_t pad1:1;
-		uint32_t ia_blend_func:3;
-		uint32_t pad0:1;
-		uint32_t ia_blend_enable:1;
-		uint32_t blend_enable:1;
-	} blend0;
-
-	struct {
-		uint32_t post_blend_clamp_enable:1;
-		uint32_t pre_blend_clamp_enable:1;
-		uint32_t clamp_range:2;
-		uint32_t pad0:4;
-		uint32_t x_dither_offset:2;
-		uint32_t y_dither_offset:2;
-		uint32_t dither_enable:1;
-		uint32_t alpha_test_func:3;
-		uint32_t alpha_test_enable:1;
-		uint32_t pad1:1;
-		uint32_t logic_op_func:4;
-		uint32_t logic_op_enable:1;
-		uint32_t pad2:1;
-		uint32_t write_disable_b:1;
-		uint32_t write_disable_g:1;
-		uint32_t write_disable_r:1;
-		uint32_t write_disable_a:1;
-		uint32_t pad3:1;
-		uint32_t alpha_to_coverage_dither:1;
-		uint32_t alpha_to_one:1;
-		uint32_t alpha_to_coverage:1;
-	} blend1;
-};
-
-struct gen6_color_calc_state {
-	struct {
-		uint32_t alpha_test_format:1;
-		uint32_t pad0:14;
-		uint32_t round_disable:1;
-		uint32_t bf_stencil_ref:8;
-		uint32_t stencil_ref:8;
-	} cc0;
-
-	union {
-		float alpha_ref_f;
-		struct {
-			uint32_t ui:8;
-			uint32_t pad0:24;
-		} alpha_ref_fi;
-	} cc1;
-
-	float constant_r;
-	float constant_g;
-	float constant_b;
-	float constant_a;
-};
-
-struct gen6_depth_stencil_state {
-	struct {
-		uint32_t pad0:3;
-		uint32_t bf_stencil_pass_depth_pass_op:3;
-		uint32_t bf_stencil_pass_depth_fail_op:3;
-		uint32_t bf_stencil_fail_op:3;
-		uint32_t bf_stencil_func:3;
-		uint32_t bf_stencil_enable:1;
-		uint32_t pad1:2;
-		uint32_t stencil_write_enable:1;
-		uint32_t stencil_pass_depth_pass_op:3;
-		uint32_t stencil_pass_depth_fail_op:3;
-		uint32_t stencil_fail_op:3;
-		uint32_t stencil_func:3;
-		uint32_t stencil_enable:1;
-	} ds0;
-
-	struct {
-		uint32_t bf_stencil_write_mask:8;
-		uint32_t bf_stencil_test_mask:8;
-		uint32_t stencil_write_mask:8;
-		uint32_t stencil_test_mask:8;
-	} ds1;
-
-	struct {
-		uint32_t pad0:26;
-		uint32_t depth_write_enable:1;
-		uint32_t depth_test_func:3;
-		uint32_t pad1:1;
-		uint32_t depth_test_enable:1;
-	} ds2;
-};
-
-struct gen6_surface_state {
-	struct {
-		uint32_t cube_pos_z:1;
-		uint32_t cube_neg_z:1;
-		uint32_t cube_pos_y:1;
-		uint32_t cube_neg_y:1;
-		uint32_t cube_pos_x:1;
-		uint32_t cube_neg_x:1;
-		uint32_t pad:3;
-		uint32_t render_cache_read_mode:1;
-		uint32_t mipmap_layout_mode:1;
-		uint32_t vert_line_stride_ofs:1;
-		uint32_t vert_line_stride:1;
-		uint32_t color_blend:1;
-		uint32_t writedisable_blue:1;
-		uint32_t writedisable_green:1;
-		uint32_t writedisable_red:1;
-		uint32_t writedisable_alpha:1;
-		uint32_t surface_format:9;
-		uint32_t data_return_format:1;
-		uint32_t pad0:1;
-		uint32_t surface_type:3;
-	} ss0;
-
-	struct {
-		uint32_t base_addr;
-	} ss1;
-
-	struct {
-		uint32_t render_target_rotation:2;
-		uint32_t mip_count:4;
-		uint32_t width:13;
-		uint32_t height:13;
-	} ss2;
-
-	struct {
-		uint32_t tile_walk:1;
-		uint32_t tiled_surface:1;
-		uint32_t pad:1;
-		uint32_t pitch:18;
-		uint32_t depth:11;
-	} ss3;
-
-	struct {
-		uint32_t pad:19;
-		uint32_t min_array_elt:9;
-		uint32_t min_lod:4;
-	} ss4;
-
-	struct {
-		uint32_t pad:20;
-		uint32_t y_offset:4;
-		uint32_t pad2:1;
-		uint32_t x_offset:7;
-	} ss5;
-};
-
-struct gen6_cc_viewport {
-	float min_depth;
-	float max_depth;
-};
-
-typedef enum {
-	SAMPLER_FILTER_NEAREST = 0,
-	SAMPLER_FILTER_BILINEAR,
-	FILTER_COUNT
-} sampler_filter_t;
-
-typedef enum {
-	SAMPLER_EXTEND_NONE = 0,
-	SAMPLER_EXTEND_REPEAT,
-	SAMPLER_EXTEND_PAD,
-	SAMPLER_EXTEND_REFLECT,
-	EXTEND_COUNT
-} sampler_extend_t;
-
-#endif
-- 
1.7.8.3




More information about the Intel-gfx mailing list