mesa: Bump version to 10.2-rc2

Signed-off-by: Ian Romanick <ian.d.romanick@intel.com>
glx/tests: Partially revert commit 51e3569573
2014-05-09 20:02:02 -07:00 · 2014-05-09 18:33:27 -07:00 · 2014-05-09 18:33:22 -07:00 · 2014-05-09 18:32:57 -07:00 · 2014-05-09 18:32:39 -07:00 · 2014-05-09 18:31:29 -07:00
288 changed files with 1496 additions and 6915 deletions
--- a/Android.mk
+++ b/Android.mk
@@ -24,7 +24,7 @@
 # BOARD_GPU_DRIVERS should be defined.  The valid values are
 #
 #   classic drivers: i915 i965
-#   gallium drivers: swrast freedreno i915g ilo nouveau r300g r600g radeonsi vmwgfx
+#   gallium drivers: swrast i915g ilo nouveau r300g r600g radeonsi vmwgfx
 #
 # The main target is libGLES_mesa.  For each classic driver enabled, a DRI
 # module will also be built.  DRI modules will be loaded by libGLES_mesa.
@@ -42,7 +42,7 @@ DRM_TOP := external/drm
 DRM_GRALLOC_TOP := hardware/drm_gralloc

 classic_drivers := i915 i965
-gallium_drivers := swrast freedreno i915g ilo nouveau r300g r600g radeonsi vmwgfx
+gallium_drivers := swrast i915g ilo nouveau r300g r600g radeonsi vmwgfx

 MESA_GPU_DRIVERS := $(strip $(BOARD_GPU_DRIVERS))

--- a/Makefile.am
+++ b/Makefile.am
@@ -64,13 +64,14 @@ IGNORE_FILES = \

 parsers: configure
 	$(MAKE) -C src/glsl glsl_parser.cpp glsl_parser.h glsl_lexer.cpp glcpp/glcpp-lex.c glcpp/glcpp-parse.c glcpp/glcpp-parse.h
+	$(MAKE) -C src/mesa program/lex.yy.c program/program_parse.tab.c program/program_parse.tab.h

 # Everything for new a Mesa release:
 ARCHIVES = $(PACKAGE_NAME).tar.gz \
 	$(PACKAGE_NAME).tar.bz2 \
 	$(PACKAGE_NAME).zip

-tarballs: checksums
+tarballs: md5
 	rm -f ../$(PACKAGE_DIR) $(PACKAGE_NAME).tar

 manifest.txt: .git
@@ -97,9 +98,9 @@ $(PACKAGE_NAME).zip: parsers ../$(PACKAGE_DIR) manifest.txt
 	zip -q -@ $(PACKAGE_NAME).zip < $(PACKAGE_DIR)/manifest.txt ; \
 	mv $(PACKAGE_NAME).zip $(PACKAGE_DIR)

-checksums: $(ARCHIVES)
-	@-sha256sum $(PACKAGE_NAME).tar.gz
-	@-sha256sum $(PACKAGE_NAME).tar.bz2
-	@-sha256sum $(PACKAGE_NAME).zip
+md5: $(ARCHIVES)
+	@-md5sum $(PACKAGE_NAME).tar.gz
+	@-md5sum $(PACKAGE_NAME).tar.bz2
+	@-md5sum $(PACKAGE_NAME).zip

 .PHONY: tarballs md5
--- a/2
+++ b/2
@@ -1 +1 @@
-10.2.8
+10.2.0-rc2
--- a/bin/.cherry-ignore
+++ b/bin/.cherry-ignore
@@ -1,30 +0,0 @@
-# The first is the change, and the second is the revert of that change.
-e6967270c75a5b669152127bb7a746d55f4407a6 i965: Fix depth (array slices) computation for 1D_ARRAY render targets.
-155f98d49fdc2f46c760f8214327b3804ee60079 Revert "i965: Fix depth (array slices) computation for 1D_ARRAY render targets."
-
-# This patch didn't have enough in the commit message to convince me it
-# is a bug fix, (email sent to author asking for more information).
-41d759d076737f94976f5294b734dbc437a12bae
-
-# These patch were already cherry-picked before the 10.2.4 release.
-#
-# But get-pick-list.sh doesn't realize that because the commit messages for
-# these on the stable branch reference commit IDs that don't actually appear
-# on master. I'm not sure what happened, (perhaps master was force-pushed at
-# some point?).
-2eaf3f670fea4ce4466340141244e41a45542c13
-e5adc560cc8544200faa3e04504202839626ab37
-cf1b5eee7f36af29d1d5caba3538ad4985e51f81
-
-# The patch depends on earlier ones that are not part of 10.2.
-b3121bfd413973f460e2cc9a9f852bdfa1265fcf mesa: guard better when building with sse4.1 optimisations
-
-# The PIPE_CAP is not in mesa 10.2 - breaks the build.
-72969e0efb7a5a011629c1001e81aa2329ede6b1 radeon/compute: Report a value for PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE
-
-# No whitespace fixes for the stable branches.
-38fccc37c1fa57c1fd373e8d71621bb4aed31083 radeonsi/compute: Whitespace fixes
-
-# The commit relies of patches restructuring r600_resource, which never made
-# it in the 10.2 branch.
-a15088338ebe544efd90bfa7934cb99521488141 radeonsi/compute: Stop leaking the input buffer
--- a/bin/get-pick-list.sh
+++ b/bin/get-pick-list.sh
@@ -14,7 +14,7 @@ git log --reverse --grep="cherry picked from commit" origin/master..HEAD |\
 	sed -e 's/^[[:space:]]*(cherry picked from commit[[:space:]]*//' -e 's/)//' > already_picked

 # Grep for commits that were marked as a candidate for the stable tree.
-git log --reverse --pretty=%H -i --grep='^\([[:space:]]*NOTE: .*[Cc]andidate\|CC:.*10\.2.*mesa-stable\)' HEAD..origin/master |\
+git log --reverse --pretty=%H -i --grep='^\([[:space:]]*NOTE: .*[Cc]andidate\|CC:.*mesa-stable\)' HEAD..origin/master |\
 while read sha
 do
 	# Check to see whether the patch is on the ignore list.
--- a/configure.ac
+++ b/configure.ac
@@ -331,19 +331,6 @@ LDFLAGS=$save_LDFLAGS

 AC_SUBST([GC_SECTIONS])

-dnl
-dnl OpenBSD does not have DT_NEEDED entries for libc by design
-dnl so when these flags are passed to ld via libtool the checks will fail
-dnl
-case "$host_os" in
-openbsd*)
-    LD_NO_UNDEFINED="" ;;
-*)
-    LD_NO_UNDEFINED="-Wl,--no-undefined" ;;
-esac
-
-AC_SUBST([LD_NO_UNDEFINED])
-
 dnl
 dnl compatibility symlinks
 dnl
@@ -494,10 +481,10 @@ AC_CHECK_FUNC([dlopen], [DEFINES="$DEFINES -DHAVE_DLOPEN"],
 AC_SUBST([DLOPEN_LIBS])

 dnl Check if that library also has dladdr
-save_LIBS="$LIBS"
-LIBS="$LIBS $DLOPEN_LIBS"
+save_LDFLAGS="$LDFLAGS"
+LDFLAGS="$LDFLAGS $DLOPEN_LIBS"
 AC_CHECK_FUNCS([dladdr])
-LIBS="$save_LIBS"
+LDFLAGS="$save_LDFLAGS"

 case "$host_os" in
 darwin*|mingw*)
@@ -1273,10 +1260,6 @@ if test "x$enable_gallium_gbm" = xyes; then
        AC_MSG_ERROR([gbm_gallium requires --enable-dri to build])
    fi

-    if test "x$enable_gallium_egl" != xyes; then
-        AC_MSG_ERROR([gbm_gallium is only used by egl_gallium])
-    fi
-
    GALLIUM_STATE_TRACKERS_DIRS="gbm $GALLIUM_STATE_TRACKERS_DIRS"
    GALLIUM_TARGET_DIRS="$GALLIUM_TARGET_DIRS gbm"
    enable_gallium_loader=yes
@@ -1297,7 +1280,6 @@ if test "x$enable_xa" = xyes; then
    fi
    GALLIUM_STATE_TRACKERS_DIRS="xa $GALLIUM_STATE_TRACKERS_DIRS"
    enable_gallium_loader=yes
-    enable_gallium_drm_loader=yes
 fi
 AM_CONDITIONAL(HAVE_ST_XA, test "x$enable_xa" = xyes)

@@ -1328,7 +1310,7 @@ AM_CONDITIONAL(HAVE_OPENVG, test "x$enable_openvg" = xyes)
 dnl
 dnl Gallium G3DVL configuration
 dnl
-if test -n "$with_gallium_drivers" -a "x$with_gallium_drivers" != xswrast; then
+if test -n "$with_gallium_drivers" && ! echo "$with_gallium_drivers" | grep -q 'swrast'; then
    if test "x$enable_xvmc" = xauto; then
 	PKG_CHECK_EXISTS([xvmc], [enable_xvmc=yes], [enable_xvmc=no])
    fi
@@ -1583,7 +1565,6 @@ strip_unwanted_llvm_flags() {
    # Use \> (marks the end of the word)
    echo `$1` | sed \
 	-e 's/-DNDEBUG\>//g' \
-	-e 's/-D_GNU_SOURCE\>//g' \
 	-e 's/-pedantic\>//g' \
 	-e 's/-Wcovered-switch-default\>//g' \
 	-e 's/-O.\>//g' \
@@ -1678,10 +1659,6 @@ if test "x$enable_gallium_llvm" = xyes; then
 else
    MESA_LLVM=0
    LLVM_VERSION_INT=0
-
-    if test "x$enable_opencl" = xyes; then
-        AC_MSG_ERROR([cannot enable OpenCL without LLVM])
-    fi
 fi

 dnl Directory for XVMC libs
@@ -1762,7 +1739,6 @@ gallium_check_st() {

 gallium_require_llvm() {
    if test "x$MESA_LLVM" = x0; then
-        case "$host" in *gnux32) return;; esac
        case "$host_cpu" in
        i*86|x86_64|amd64) AC_MSG_ERROR([LLVM is required to build $1 on x86 and x86_64]);;
        esac
@@ -1815,9 +1791,6 @@ if test -n "$with_gallium_drivers"; then
        case "x$driver" in
        xsvga)
            HAVE_GALLIUM_SVGA=yes
-            if test "x$have_libdrm" != xyes; then
-                AC_MSG_ERROR([Building svga requires libdrm >= $LIBDRM_REQUIRED])
-            fi
            GALLIUM_DRIVERS_DIRS="$GALLIUM_DRIVERS_DIRS svga softpipe"
            gallium_require_drm_loader
            gallium_check_st "svga/drm" "dri-vmwgfx" ""
--- a/docs/index.html
+++ b/docs/index.html
@@ -16,20 +16,6 @@

 <h1>News</h1>

-<h2>June 6, 2014</h2>
-<p>
-<a href="relnotes/10.2.1.html">Mesa 10.2.1</a> is released.  This release
-only fixes a build error in the radeonsi driver that was introduced between
-10.2-rc5 and the 10.2 final release.
-</p>
-
-<h2>June 6, 2014</h2>
-<p>
-<a href="relnotes/10.2.html">Mesa 10.2</a> is released.  This is a new
-development release.  See the release notes for more information about
-the release.
-</p>
-
 <h2>April 18, 2014</h2>
 <p>
 <a href="relnotes/10.1.1.html">Mesa 10.1.1</a> is released.
--- a/docs/relnotes.html
+++ b/docs/relnotes.html
@@ -21,8 +21,6 @@ The release notes summarize what's new or changed in each Mesa release.
 </p>

 <ul>
-<li><a href="relnotes/10.2.1.html">10.2.1 release notes</a>
-<li><a href="relnotes/10.2.html">10.2 release notes</a>
 <li><a href="relnotes/10.1.1.html">10.1.1 release notes</a>
 <li><a href="relnotes/10.1.html">10.1 release notes</a>
 <li><a href="relnotes/10.0.5.html">10.0.5 release notes</a>
--- a/docs/relnotes/10.2.1.html
+++ b/docs/relnotes/10.2.1.html
@@ -1,61 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
-<html lang="en">
-<head>
-  <meta http-equiv="content-type" content="text/html; charset=utf-8">
-  <title>Mesa Release Notes</title>
-  <link rel="stylesheet" type="text/css" href="../mesa.css">
-</head>
-<body>
-
-<div class="header">
-  <h1>The Mesa 3D Graphics Library</h1>
-</div>
-
-<iframe src="../contents.html"></iframe>
-<div class="content">
-
-<h1>Mesa 10.2.1 Release Notes / June 6, 2014</h1>
-
-<p>
-Mesa 10.2.1 is a bug fix release which fixes bugs found since the 10.1 release.
-</p>
-<p>
-Mesa 10.2.1 implements the OpenGL 3.3 API, but the version reported by
-glGetString(GL_VERSION) or glGetIntegerv(GL_MAJOR_VERSION) /
-glGetIntegerv(GL_MINOR_VERSION) depends on the particular driver being used.
-Some drivers don't support all the features required in OpenGL 3.3.  OpenGL
-3.3 is <strong>only</strong> available if requested at context creation
-because compatibility contexts are not supported.
-</p>
-
-
-<h2>MD5 checksums</h2>
-<pre>
-96f892dae2d0bb14ac9c2113f586c909  MesaLib-10.2.1.tar.gz
-093f9b5d077e5f6061dcd7b01b7aa51a  MesaLib-10.2.1.tar.bz2
-6ab76c1608e5deed1eb8b54c62d7a48a  MesaLib-10.2.1.zip
-</pre>
-
-
-<h2>New features</h2>
-<p>None</p>
-
-<h2>Bug fixes</h2>
-
-<p>
-Mesa 10.2 had a build problem in the radeonsi driver due to an error resolving
-conflicts in a patch cherry-pick from master.  The build error is fixed.
-</p>
-
-<h2>Changes</h2>
-
-<p>Ian Romanick (3):</p>
-<ul>
-  <li>docs: Add MD5 checksum, etc. for 10.1 release</li>
-  <li>radeonsi: Fix build error introduced in 5ab9a9c</li>
-  <li>Bump version to 10.2.1</li>
-</ul>
-
-</div>
-</body>
-</html>
--- a/docs/relnotes/10.2.2.html
+++ b/docs/relnotes/10.2.2.html
@@ -1,181 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
-<html lang="en">
-<head>
-  <meta http-equiv="content-type" content="text/html; charset=utf-8">
-  <title>Mesa Release Notes</title>
-  <link rel="stylesheet" type="text/css" href="../mesa.css">
-</head>
-<body>
-
-<div class="header">
-  <h1>The Mesa 3D Graphics Library</h1>
-</div>
-
-<iframe src="../contents.html"></iframe>
-<div class="content">
-
-<h1>Mesa 10.2.2 Release Notes / June 24, 2014</h1>
-
-<p>
-Mesa 10.2.2 is a bug fix release which fixes bugs found since the 10.2.1 release.
-</p>
-<p>
-Mesa 10.2.2 implements the OpenGL 3.3 API, but the version reported by
-glGetString(GL_VERSION) or glGetIntegerv(GL_MAJOR_VERSION) /
-glGetIntegerv(GL_MINOR_VERSION) depends on the particular driver being used.
-Some drivers don't support all the features required in OpenGL 3.3.  OpenGL
-3.3 is <strong>only</strong> available if requested at context creation
-because compatibility contexts are not supported.
-</p>
-
-
-<h2>SHA256 checksums</h2>
-<pre>
-38c4a40364000f89cddaa1694f6f3cfb444981d1110238ce603093585477399c  MesaLib-10.2.2.tar.bz2
-2af2ec8b4db624c352e961eefbcce6c8d1f86d44c5542f6f378c50e1b958d453  MesaLib-10.2.2.tar.gz
-d4c0372da59367a344d62ebcdf5cf61039c9cae6925f40f2dab8f8d95cf22da9  MesaLib-10.2.2.zip
-</pre>
-
-
-<h2>New features</h2>
-<p>None</p>
-
-<h2>Bug fixes</h2>
-
-<p>This list is likely incomplete.</p>
-
-<ul>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=54372">Bug 54372</a> - GLX_INTEL_swap_event crashes driver when swapping window buffers</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=66452">Bug 66452</a> - JUNIPER UVD accelerated playback of WMV3 streams does not work</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=74005">Bug 74005</a> - [i965 Bisected]Piglit/glx_glx-make-glxdrawable-current fails</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=77865">Bug 77865</a> - [BDW] Many Ogles3conform framebuffer_blit cases fail</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=78581">Bug 78581</a> - OpenCL: clBuildProgram prints error messages directly rather than storing them</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=79029">Bug 79029</a> - INTEL_DEBUG=shader_time is full of lies</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=79729">Bug 79729</a> - [i965] glClear on a multisample texture doesn't work</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=79907">Bug 79907</a> - Mesa 10.2.1 --enable-vdpau default=auto broken</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=80115">Bug 80115</a> - MESA_META_DRAW_BUFFERS induced GL_INVALID_VALUE errors</li>
-
-</ul>
-
-
-<h2>Changes</h2>
-
-<p>Adrian Negreanu (8):</p>
-<ul>
-  <li>add megadriver_stub_FILES</li>
-  <li>android: adapt to the megadriver mechanism</li>
-  <li>android: add libloader to libGLES_mesa and libmesa_egl_dri2</li>
-  <li>android: add src/gallium/auxiliary as include path for libmesa_dricore</li>
-  <li>android, egl: add correct drm include for libmesa_egl_dri2</li>
-  <li>android, egl: typo dri2_fallback_pixmap_surface -&gt; dri2_fallback_create_pixmap_surface</li>
-  <li>android, mesa_gen_matypes: pull in timespec POSIX definition</li>
-  <li>android, dricore: undefined reference to _mesa_streaming_load_memcpy</li>
-</ul>
-
-<p>Carl Worth (1):</p>
-<ul>
-  <li>Update VERSION to 10.2.2</li>
-</ul>
-
-<p>Daniel Manjarres (1):</p>
-<ul>
-  <li>glx: Don't crash on swap event for a Window (non-GLXWindow)</li>
-</ul>
-
-<p>Emil Velikov (3):</p>
-<ul>
-  <li>targets/xa: limit the amount of exported symbols</li>
-  <li>configure: error out when building opencl without LLVM</li>
-  <li>configure: correctly autodetect xvmc/vdpau/omx</li>
-</ul>
-
-<p>Grigori Goronzy (1):</p>
-<ul>
-  <li>radeon/uvd: disable VC-1 simple/main on UVD 2.x</li>
-</ul>
-
-<p>Iago Toral Quiroga (1):</p>
-<ul>
-  <li>mesa: Copy Geom.UsesEndPrimitive when cloning a geometry program.</li>
-</ul>
-
-<p>Ian Romanick (3):</p>
-<ul>
-  <li>docs: Add initial 10.2.1 release notes</li>
-  <li>docs: Add MD5 checksum, etc. for 10.2.1 release</li>
-  <li>meta: Respect the driver's maximum number of draw buffers</li>
-</ul>
-
-<p>Ilia Mirkin (7):</p>
-<ul>
-  <li>gk110/ir: emit saturate flag on fadd when needed</li>
-  <li>gk110/ir: fix emitting constbuf file index</li>
-  <li>gk110/ir: fix bfind emission</li>
-  <li>nv50: make sure to mark first scissor dirty after blit</li>
-  <li>nv30: plug some memory leaks on screen destroy and shader compile</li>
-  <li>nv30: avoid dangling references to deleted contexts</li>
-  <li>nv30: hack to avoid errors on unexpected color/zeta combinations</li>
-</ul>
-
-<p>Jason Ekstrand (1):</p>
-<ul>
-  <li>meta_blit: properly compute texture width for the CopyTexSubImage fallback</li>
-</ul>
-
-<p>José Fonseca (1):</p>
-<ul>
-  <li>mesa/main: Prevent sefgault on glGetIntegerv(GL_ATOMIC_COUNTER_BUFFER_BINDING).</li>
-</ul>
-
-<p>Kenneth Graunke (9):</p>
-<ul>
-  <li>i965: Don't use the head sentinel as an fs_inst in Gen4 workaround code.</li>
-  <li>i965: Invalidate live intervals when inserting Gen4 SEND workarounds.</li>
-  <li>i965/vec4: Fix dead code elimination for VGRFs of size &gt; 1.</li>
-  <li>i965: Add missing MOCS setup for 3DSTATE_INDEX_BUFFER on Broadwell.</li>
-  <li>i965: Drop Broadwell perf_debugs about missing MOCS that aren't missing.</li>
-  <li>i965: Add missing newlines to a few perf_debug messages.</li>
-  <li>i965/vec4: Use the sampler for pull constant loads on Broadwell.</li>
-  <li>i965: Use 8x4 aligned rectangles for HiZ operations on Broadwell.</li>
-  <li>i965: Save meta stencil blit programs in the context.</li>
-</ul>
-
-<p>Kristian Høgsberg (1):</p>
-<ul>
-  <li>mesa: Remove glClear optimization based on drawable size</li>
-</ul>
-
-<p>Michel Dänzer (1):</p>
-<ul>
-  <li>configure: Only check for OpenCL without LLVM when the latter is certain</li>
-</ul>
-
-<p>Neil Roberts (1):</p>
-<ul>
-  <li>i965: Set the fast clear color value for texture surfaces</li>
-</ul>
-
-<p>Tom Stellard (2):</p>
-<ul>
-  <li>clover: Prevent Clang from printing number of errors and warnings to stderr.</li>
-  <li>clover: Don't use llvm's global context</li>
-</ul>
-
-<p>Ville Syrjälä (1):</p>
-<ul>
-  <li>i915: Fix gen2 texblend setup</li>
-</ul>
-
-
-</div>
-</body>
-</html>
--- a/docs/relnotes/10.2.3.html
+++ b/docs/relnotes/10.2.3.html
@@ -1,130 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
-<html lang="en">
-<head>
-  <meta http-equiv="content-type" content="text/html; charset=utf-8">
-  <title>Mesa Release Notes</title>
-  <link rel="stylesheet" type="text/css" href="../mesa.css">
-</head>
-<body>
-
-<div class="header">
-  <h1>The Mesa 3D Graphics Library</h1>
-</div>
-
-<iframe src="../contents.html"></iframe>
-<div class="content">
-
-<h1>Mesa 10.2.3 Release Notes / July 7, 2014</h1>
-
-<p>
-Mesa 10.2.3 is a bug fix release which fixes bugs found since the 10.2.2 release.
-</p>
-<p>
-Mesa 10.2.3 implements the OpenGL 3.3 API, but the version reported by
-glGetString(GL_VERSION) or glGetIntegerv(GL_MAJOR_VERSION) /
-glGetIntegerv(GL_MINOR_VERSION) depends on the particular driver being used.
-Some drivers don't support all the features required in OpenGL 3.3.  OpenGL
-3.3 is <strong>only</strong> available if requested at context creation
-because compatibility contexts are not supported.
-</p>
-
-
-<h2>SHA256 checksums</h2>
-<pre>
-e482a96170c98b17d6aba0d6e4dda4b9a2e61c39587bb64ac38cadfa4aba4aeb  MesaLib-10.2.3.tar.bz2
-96cffacaa1c52ae659b3b0f91be2eebf5528b748934256751261fb79ea3d6636  MesaLib-10.2.3.tar.gz
-82cab6ff14c8038ee39842dbdea0d447a78d119efd8d702d1497bc7c246434e9  MesaLib-10.2.3.zip
-</pre>
-
-
-<h2>New features</h2>
-<p>None</p>
-
-<h2>Bug fixes</h2>
-
-<p>This list is likely incomplete.</p>
-
-<ul>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=76223">Bug 76223</a> - </li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=79823">Bug 79823</a> - </li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=80015">Bug 80015</a> - </li>
-
-</ul>
-
-<h2>Changes</h2>
-
-<p>Aaron Watry (1):</p>
-<ul>
-  <li>radeon/llvm: Allocate space for kernel metadata operands</li>
-</ul>
-
-<p>Carl Worth (2):</p>
-<ul>
-  <li>docs: Add sha256 sums for the 10.2.2 release</li>
-  <li>cherry-ignore: Add a patch that's been rejected</li>
-</ul>
-
-<p>Ilia Mirkin (4):</p>
-<ul>
-  <li>nouveau: dup fd before passing it to device</li>
-  <li>nv50: disable dedicated ubo upload method</li>
-  <li>nv50: do an explicit flush on draw when there are persistent buffers</li>
-  <li>nvc0: add a memory barrier when there are persistent UBOs</li>
-</ul>
-
-<p>Jasper St. Pierre (1):</p>
-<ul>
-  <li>glxext: Send the Drawable's ID in the GLX_BufferSwapComplete event</li>
-</ul>
-
-<p>Kenneth Graunke (3):</p>
-<ul>
-  <li>i965: Don't emit SURFACE_STATEs for gather workarounds on Broadwell.</li>
-  <li>i965: Include marketing names for Broadwell GPUs.</li>
-  <li>i965/disasm: Fix INTEL_DEBUG=fs on Broadwell for ARB_fp applications.</li>
-</ul>
-
-<p>Michel Dänzer (1):</p>
-<ul>
-  <li>radeon/llvm: Use the llvm.rsq.clamped intrinsic for RSQ</li>
-</ul>
-
-<p>Rob Clark (9):</p>
-<ul>
-  <li>xa: fix segfault</li>
-  <li>freedreno: use OUT_RELOCW when buffer is written</li>
-  <li>freedreno/a3xx: fix depth/stencil GMEM positioning</li>
-  <li>freedreno/a3xx: fix depth/stencil gmem restore</li>
-  <li>freedreno/a3xx: fix blend opcode</li>
-  <li>freedreno: few caps fixes</li>
-  <li>freedreno/a3xx: texture fixes</li>
-  <li>freedreno: fix for null textures</li>
-  <li>freedreno/a3xx: vtx formats</li>
-</ul>
-
-<p>Roland Scheidegger (1):</p>
-<ul>
-  <li>draw: (trivial) fix clamping of viewport index</li>
-</ul>
-
-<p>Takashi Iwai (1):</p>
-<ul>
-  <li>llvmpipe: Fix zero-division in llvmpipe_texture_layout()</li>
-</ul>
-
-<p>Thomas Hellstrom (1):</p>
-<ul>
-  <li>st/xa: Don't close the drm fd on failure v2</li>
-</ul>
-
-<p>Tobias Klausmann (1):</p>
-<ul>
-  <li>nv50/ir: allow gl_ViewportIndex to work on non-provoking vertices</li>
-</ul>
-
-</div>
-</body>
-</html>
--- a/docs/relnotes/10.2.4.html
+++ b/docs/relnotes/10.2.4.html
@@ -1,127 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
-<html lang="en">
-<head>
-  <meta http-equiv="content-type" content="text/html; charset=utf-8">
-  <title>Mesa Release Notes</title>
-  <link rel="stylesheet" type="text/css" href="../mesa.css">
-</head>
-<body>
-
-<div class="header">
-  <h1>The Mesa 3D Graphics Library</h1>
-</div>
-
-<iframe src="../contents.html"></iframe>
-<div class="content">
-
-<h1>Mesa 10.2.4 Release Notes / July 18, 2014</h1>
-
-<p>
-Mesa 10.2.4 is a bug fix release which fixes bugs found since the 10.2.3 release.
-</p>
-<p>
-Mesa 10.2.4 implements the OpenGL 3.3 API, but the version reported by
-glGetString(GL_VERSION) or glGetIntegerv(GL_MAJOR_VERSION) /
-glGetIntegerv(GL_MINOR_VERSION) depends on the particular driver being used.
-Some drivers don't support all the features required in OpenGL 3.3.  OpenGL
-3.3 is <strong>only</strong> available if requested at context creation
-because compatibility contexts are not supported.
-</p>
-
-
-<h2>SHA256 checksums</h2>
-<pre>
-06a2341244eb85c283f59f70161e06ded106f835ed9b6be1ef0243bd9344811a  MesaLib-10.2.4.tar.bz2
-33e3c8b4343503e7d7d17416c670438860a2fd99ec93ea3327f73c3abe33b5e4  MesaLib-10.2.4.tar.gz
-e26791a4a62a61b82e506e6ba031812d09697d1a831e8239af67e5722a8ee538  MesaLib-10.2.4.zip
-</pre>
-
-<h2>New features</h2>
-<p>None</p>
-
-<h2>Bug fixes</h2>
-
-<p>This list is likely incomplete.</p>
-
-<ul>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=81157">Bug 81157</a> - [BDW]Piglit some spec_glsl-1.50_execution_built-in-functions* cases fail</li>
-
-</ul>
-
-<h2>Changes</h2>
-
-<p>Abdiel Janulgue (3):</p>
-<ul>
-  <li>i965/fs: Refactor check for potential copy propagated instructions.</li>
-  <li>i965/fs: skip copy-propate for logical instructions with negated src entries</li>
-  <li>i965/vec4: skip copy-propate for logical instructions with negated src entries</li>
-</ul>
-
-<p>Brian Paul (3):</p>
-<ul>
-  <li>mesa: fix geometry shader memory leaks</li>
-  <li>st/mesa: fix geometry shader memory leak</li>
-  <li>gallium/u_blitter: fix some shader memory leaks</li>
-</ul>
-
-<p>Carl Worth (2):</p>
-<ul>
-  <li>docs: Add sha256 checksums for the 10.2.3 release</li>
-  <li>Update VERSION to 10.2.4</li>
-</ul>
-
-<p>Eric Anholt (1):</p>
-<ul>
-  <li>i965: Generalize the pixel_x/y workaround for all UW types.</li>
-</ul>
-
-<p>Ilia Mirkin (4):</p>
-<ul>
-  <li>nv50/ir: retrieve shadow compare from first arg</li>
-  <li>nv50/ir: ignore bias for samplerCubeShadow on nv50</li>
-  <li>nvc0/ir: do quadops on the right texture coordinates for TXD</li>
-  <li>nvc0/ir: use manual TXD when offsets are involved</li>
-</ul>
-
-<p>Jordan Justen (1):</p>
-<ul>
-  <li>i965: Add auxiliary surface field #defines for Broadwell.</li>
-</ul>
-
-<p>Kenneth Graunke (9):</p>
-<ul>
-  <li>i965: Don't copy propagate abs into Broadwell logic instructions.</li>
-  <li>i965: Set execution size to 8 for instructions with force_sechalf set.</li>
-  <li>i965/fs: Set force_uncompressed and force_sechalf on samplepos setup.</li>
-  <li>i965/fs: Use WE_all for gl_SampleID header register munging.</li>
-  <li>i965: Add plumbing for Broadwell's auxiliary surface support.</li>
-  <li>i965: Drop SINT workaround for CMS layout on Broadwell.</li>
-  <li>i965: Hook up the MCS buffers in SURFACE_STATE on Broadwell.</li>
-  <li>i965: Add 2x MSAA support to the MCS allocation function.</li>
-  <li>i965: Enable compressed multisample support (CMS) on Broadwell.</li>
-</ul>
-
-<p>Marek Olšák (4):</p>
-<ul>
-  <li>gallium: fix u_default_transfer_inline_write for textures</li>
-  <li>st/mesa: fix samplerCubeShadow with bias</li>
-  <li>radeonsi: fix samplerCubeShadow with bias</li>
-  <li>radeonsi: add support for TXB2</li>
-</ul>
-
-<p>Matt Turner (8):</p>
-<ul>
-  <li>i965/vec4: Don't return void from a void function.</li>
-  <li>i965/vec4: Don't fix_math_operand() on Gen &gt;= 8.</li>
-  <li>i965/fs: Don't fix_math_operand() on Gen &gt;= 8.</li>
-  <li>i965/fs: Make try_constant_propagate() static.</li>
-  <li>i965/fs: Constant propagate into 2-src math instructions on Gen8.</li>
-  <li>i965/vec4: Constant propagate into 2-src math instructions on Gen8.</li>
-  <li>i965/fs: Don't use brw_imm_* unnecessarily.</li>
-  <li>i965/fs: Set correct number of regs_written for MCS fetches.</li>
-</ul>
-
-</div>
-</body>
-</html>
--- a/docs/relnotes/10.2.5.html
+++ b/docs/relnotes/10.2.5.html
@@ -1,188 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
-<html lang="en">
-<head>
-  <meta http-equiv="content-type" content="text/html; charset=utf-8">
-  <title>Mesa Release Notes</title>
-  <link rel="stylesheet" type="text/css" href="../mesa.css">
-</head>
-<body>
-
-<div class="header">
-  <h1>The Mesa 3D Graphics Library</h1>
-</div>
-
-<iframe src="../contents.html"></iframe>
-<div class="content">
-
-<h1>Mesa 10.2.5 Release Notes / August 2, 2014</h1>
-
-<p>
-Mesa 10.2.5 is a bug fix release which fixes bugs found since the 10.2.4 release.
-</p>
-<p>
-Mesa 10.2.5 implements the OpenGL 3.3 API, but the version reported by
-glGetString(GL_VERSION) or glGetIntegerv(GL_MAJOR_VERSION) /
-glGetIntegerv(GL_MINOR_VERSION) depends on the particular driver being used.
-Some drivers don't support all the features required in OpenGL 3.3.  OpenGL
-3.3 is <strong>only</strong> available if requested at context creation
-because compatibility contexts are not supported.
-</p>
-
-<h2>SHA256 checksums</h2>
-<pre>
-b4459f0bf7f4a3c8fb78ece3c9d2eac3d0e5bf38cb470f2a72705e744bd0310d  MesaLib-10.2.5.tar.bz2
-7b4dd0cb683f8c7dc48a3e7a315742bed58ddcd7b756c462aca4177bd1acdc79  MesaLib-10.2.5.tar.gz
-6180565914fb238dd77ccdaff96b6155d9a6e1b3e981ebbf6a6851301b384fed  MesaLib-10.2.5.zip
-</pre>
-
-<h2>New features</h2>
-<p>None</p>
-
-<h2>Bug fixes</h2>
-
-<p>This list is likely incomplete.</p>
-
-<ul>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=80991">Bug 80991</a> - [BDW]Piglit spec_ARB_sample_shading_builtin-gl-sample-mask_2 fails</li>
-
-</ul>
-
-<h2>Changes</h2>
-
-<p>Abdiel Janulgue (3):</p>
-<ul>
-  <li>i965/fs: Refactor check for potential copy propagated instructions.</li>
-  <li>i965/fs: skip copy-propate for logical instructions with negated src entries</li>
-  <li>i965/vec4: skip copy-propate for logical instructions with negated src entries</li>
-</ul>
-
-<p>Adel Gadllah (1):</p>
-<ul>
-  <li>i915: Fix up intelInitScreen2 for DRI3</li>
-</ul>
-
-<p>Anuj Phogat (2):</p>
-<ul>
-  <li>i965: Fix z_offset computation in intel_miptree_unmap_depthstencil()</li>
-  <li>mesa: Don't use memcpy() in _mesa_texstore() for float depth texture data</li>
-</ul>
-
-<p>Brian Paul (3):</p>
-<ul>
-  <li>mesa: fix geometry shader memory leaks</li>
-  <li>st/mesa: fix geometry shader memory leak</li>
-  <li>gallium/u_blitter: fix some shader memory leaks</li>
-</ul>
-
-<p>Carl Worth (6):</p>
-<ul>
-  <li>docs: Add sha256 checksums for the 10.2.3 release</li>
-  <li>Update VERSION to 10.2.4</li>
-  <li>Add release notes for 10.2.4</li>
-  <li>docs: Add SHA256 checksums for the 10.2.4 release</li>
-  <li>cherry-ignore: Ignore a few patches picked in the previous stable release</li>
-  <li>Update version to 10.2.5</li>
-</ul>
-
-<p>Christian König (1):</p>
-<ul>
-  <li>radeonsi: fix order of r600_need_dma_space and r600_context_bo_reloc</li>
-</ul>
-
-<p>Eric Anholt (1):</p>
-<ul>
-  <li>i965: Generalize the pixel_x/y workaround for all UW types.</li>
-</ul>
-
-<p>Ian Romanick (2):</p>
-<ul>
-  <li>mesa: Don't allow GL_TEXTURE_BORDER queries outside compat profile</li>
-  <li>mesa: Don't allow GL_TEXTURE_{LUMINANCE,INTENSITY}_* queries outside compat profile</li>
-</ul>
-
-<p>Ilia Mirkin (5):</p>
-<ul>
-  <li>nv50/ir: retrieve shadow compare from first arg</li>
-  <li>nv50/ir: ignore bias for samplerCubeShadow on nv50</li>
-  <li>nvc0/ir: do quadops on the right texture coordinates for TXD</li>
-  <li>nvc0/ir: use manual TXD when offsets are involved</li>
-  <li>nvc0: make sure that the local memory allocation is aligned to 0x10</li>
-</ul>
-
-<p>Jason Ekstrand (2):</p>
-<ul>
-  <li>main/format_pack: Fix a wrong datatype in pack_ubyte_R8G8_UNORM</li>
-  <li>main/get_hash_params: Add GL_SAMPLE_SHADING_ARB</li>
-</ul>
-
-<p>Jordan Justen (1):</p>
-<ul>
-  <li>i965: Add auxiliary surface field #defines for Broadwell.</li>
-</ul>
-
-<p>José Fonseca (1):</p>
-<ul>
-  <li>st/wgl: Clamp wglChoosePixelFormatARB's output nNumFormats to nMaxFormats.</li>
-</ul>
-
-<p>Kenneth Graunke (13):</p>
-<ul>
-  <li>i965: Don't copy propagate abs into Broadwell logic instructions.</li>
-  <li>i965: Set execution size to 8 for instructions with force_sechalf set.</li>
-  <li>i965/fs: Set force_uncompressed and force_sechalf on samplepos setup.</li>
-  <li>i965/fs: Use WE_all for gl_SampleID header register munging.</li>
-  <li>i965: Add plumbing for Broadwell's auxiliary surface support.</li>
-  <li>i965: Drop SINT workaround for CMS layout on Broadwell.</li>
-  <li>i965: Hook up the MCS buffers in SURFACE_STATE on Broadwell.</li>
-  <li>i965: Add 2x MSAA support to the MCS allocation function.</li>
-  <li>i965: Enable compressed multisample support (CMS) on Broadwell.</li>
-  <li>i965: Add missing persample_shading field to brw_wm_debug_recompile.</li>
-  <li>i965/fs: Fix gl_SampleID for 2x MSAA and SIMD16 mode.</li>
-  <li>i965/fs: Fix gl_SampleMask handling for SIMD16 on Gen8+.</li>
-  <li>i965/fs: Set LastRT on the final FB write on Broadwell.</li>
-</ul>
-
-<p>Marek Olšák (14):</p>
-<ul>
-  <li>gallium: fix u_default_transfer_inline_write for textures</li>
-  <li>st/mesa: fix samplerCubeShadow with bias</li>
-  <li>radeonsi: fix samplerCubeShadow with bias</li>
-  <li>radeonsi: add support for TXB2</li>
-  <li>r600g: switch SNORM conversion to DX and GLES behavior</li>
-  <li>radeonsi: fix CMASK and HTILE calculations for Hawaii</li>
-  <li>gallium/util: add a helper for calculating primitive count from vertex count</li>
-  <li>radeonsi: fix a hang with instancing on Hawaii</li>
-  <li>radeonsi: fix a hang with streamout on Hawaii</li>
-  <li>winsys/radeon: fix vram_size overflow with Hawaii</li>
-  <li>radeonsi: fix occlusion queries on Hawaii</li>
-  <li>r600g,radeonsi: switch all occurences of array_size to util_max_layer</li>
-  <li>radeonsi: fix build because of lack of draw_indirect infrastructure in 10.2</li>
-  <li>radeonsi: use DRAW_PREAMBLE on CIK</li>
-</ul>
-
-<p>Matt Turner (8):</p>
-<ul>
-  <li>i965/vec4: Don't return void from a void function.</li>
-  <li>i965/vec4: Don't fix_math_operand() on Gen &gt;= 8.</li>
-  <li>i965/fs: Don't fix_math_operand() on Gen &gt;= 8.</li>
-  <li>i965/fs: Make try_constant_propagate() static.</li>
-  <li>i965/fs: Constant propagate into 2-src math instructions on Gen8.</li>
-  <li>i965/vec4: Constant propagate into 2-src math instructions on Gen8.</li>
-  <li>i965/fs: Don't use brw_imm_* unnecessarily.</li>
-  <li>i965/fs: Set correct number of regs_written for MCS fetches.</li>
-</ul>
-
-<p>Thorsten Glaser (1):</p>
-<ul>
-  <li>nv50: fix build failure on m68k due to invalid struct alignment assumptions</li>
-</ul>
-
-<p>Tom Stellard (1):</p>
-<ul>
-  <li>clover: Call end_query before getting timestamp result v2</li>
-</ul>
-
-</div>
-</body>
-</html>
--- a/docs/relnotes/10.2.6.html
+++ b/docs/relnotes/10.2.6.html
@@ -1,118 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
-<html lang="en">
-<head>
-  <meta http-equiv="content-type" content="text/html; charset=utf-8">
-  <title>Mesa Release Notes</title>
-  <link rel="stylesheet" type="text/css" href="../mesa.css">
-</head>
-<body>
-
-<div class="header">
-  <h1>The Mesa 3D Graphics Library</h1>
-</div>
-
-<iframe src="../contents.html"></iframe>
-<div class="content">
-
-<h1>Mesa 10.2.6 Release Notes / August 19, 2014</h1>
-
-<p>
-Mesa 10.2.6 is a bug fix release which fixes bugs found since the 10.2.5 release.
-</p>
-<p>
-Mesa 10.2.6 implements the OpenGL 3.3 API, but the version reported by
-glGetString(GL_VERSION) or glGetIntegerv(GL_MAJOR_VERSION) /
-glGetIntegerv(GL_MINOR_VERSION) depends on the particular driver being used.
-Some drivers don't support all the features required in OpenGL 3.3.  OpenGL
-3.3 is <strong>only</strong> available if requested at context creation
-because compatibility contexts are not supported.
-</p>
-
-<h2>SHA256 checksums</h2>
-<pre>
-193314d2adba98e43697d726739ac46b4299aae324fa1821aa226890c28ac806  MesaLib-10.2.6.tar.bz2
-f7a45a5977b485eb95ac024205c584a0c112fe3951c2313c797579bb16a7a448  MesaLib-10.2.6.tar.gz
-6d086d6fcda8f317adfaaae40011decf2f2e2dc80819c4a7a77c76f73512e8d8  MesaLib-10.2.6.zip
-</pre>
-
-<h2>New features</h2>
-<p>None</p>
-
-<h2>Bug fixes</h2>
-
-<p>This list is likely incomplete.</p>
-
-<ul>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=81450">Bug 81450</a> - [BDW]Piglit spec_glsl-1.30_execution_tex-miplevel-selection_textureGrad_1DArray cases intel_do_flush_locked failed</li>
-
-</ul>
-
-<h2>Changes</h2>
-
-<p>Anuj Phogat (15):</p>
-<ul>
-  <li>mesa: Fix error condition for valid texture targets in glTexStorage* functions</li>
-  <li>mesa: Turn target_can_be_compressed() in to a utility function</li>
-  <li>mesa: Add error condition for using compressed internalformat in glTexStorage3D()</li>
-  <li>mesa: Fix condition for using compressed internalformat in glCompressedTexImage3D()</li>
-  <li>mesa: Add utility function _mesa_is_enum_format_snorm()</li>
-  <li>mesa: Don't allow snorm internal formats in glCopyTexImage*() in GLES3</li>
-  <li>mesa: Add a helper function _mesa_is_enum_format_unsized()</li>
-  <li>mesa: Add a gles3 error condition for sized internalformat in glCopyTexImage*()</li>
-  <li>mesa: Add gles3 error condition for GL_RGBA10_A2 buffer format in glCopyTexImage*()</li>
-  <li>mesa: Add utility function _mesa_is_enum_format_unorm()</li>
-  <li>mesa: Add gles3 condition for normalized internal formats in glCopyTexImage*()</li>
-  <li>mesa: Allow GL_TEXTURE_CUBE_MAP target with compressed internal formats</li>
-  <li>meta: Use _mesa_get_format_bits() to get the GL_RED_BITS</li>
-  <li>egl: Fix OpenGL ES version checks in _eglParseContextAttribList()</li>
-  <li>meta: Fix datatype computation in get_temp_image_type()</li>
-</ul>
-
-<p>Brian Paul (1):</p>
-<ul>
-  <li>mesa: fix assertion in _mesa_drawbuffers()</li>
-</ul>
-
-<p>Carl Worth (2):</p>
-<ul>
-  <li>docs: Add sha256 sums to the 10.2.5 release notes</li>
-  <li>Update VERSION to 10.2.6</li>
-</ul>
-
-<p>Ilia Mirkin (1):</p>
-<ul>
-  <li>mesa/st: only convert AND(a, NOT(b)) into MAD when not using native integers</li>
-</ul>
-
-<p>Jordan Justen (1):</p>
-<ul>
-  <li>i965/miptree: Layout 1D Array as 2D Array with height of 1</li>
-</ul>
-
-<p>Maarten Lankhorst (1):</p>
-<ul>
-  <li>configure.ac: Do not require llvm on x32</li>
-</ul>
-
-<p>Marek Olšák (4):</p>
-<ul>
-  <li>st/mesa: fix blit-based partial TexSubImage for 1D arrays</li>
-  <li>radeon,r200: fix buffer validation after CS flush</li>
-  <li>radeonsi: fix a hang with instancing in Unigine Heaven/Valley on Hawaii</li>
-  <li>radeonsi: fix CMASK and HTILE allocation on Tahiti</li>
-</ul>
-
-<p>Pali Rohár (1):</p>
-<ul>
-  <li>configure: check for dladdr via AC_CHECK_FUNC/AC_CHECK_LIB</li>
-</ul>
-
-<p>Roland Scheidegger (1):</p>
-<ul>
-  <li>gallivm: fix up out-of-bounds level when using conformant out-of-bound behavior</li>
-</ul>
-
-</div>
-</body>
-</html>
--- a/docs/relnotes/10.2.7.html
+++ b/docs/relnotes/10.2.7.html
@@ -1,211 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
-<html lang="en">
-<head>
-  <meta http-equiv="content-type" content="text/html; charset=utf-8">
-  <title>Mesa Release Notes</title>
-  <link rel="stylesheet" type="text/css" href="../mesa.css">
-</head>
-<body>
-
-<div class="header">
-  <h1>The Mesa 3D Graphics Library</h1>
-</div>
-
-<iframe src="../contents.html"></iframe>
-<div class="content">
-
-<h1>Mesa 10.2.7 Release Notes / September 06, 2014</h1>
-
-<p>
-Mesa 10.2.7 is a bug fix release which fixes bugs found since the 10.2.6 release.
-</p>
-<p>
-Mesa 10.2.7 implements the OpenGL 3.3 API, but the version reported by
-glGetString(GL_VERSION) or glGetIntegerv(GL_MAJOR_VERSION) /
-glGetIntegerv(GL_MINOR_VERSION) depends on the particular driver being used.
-Some drivers don't support all the features required in OpenGL 3.3.  OpenGL
-3.3 is <strong>only</strong> available if requested at context creation
-because compatibility contexts are not supported.
-</p>
-
-<h2>SHA256 checksums</h2>
-<pre>
-cb67dfaabf88acba29aa2cf0dd58ee17b21ebf9594f8d1226c41794da8de3e9d  MesaLib-10.2.7.tar.gz
-27b958063a4c002071f14ed45c7d2a1ee52cd85e4ac8876e8a1c273495a7d43f  MesaLib-10.2.7.tar.bz2
-a2796a2d5bbbc2edd22857ecc267cba68dfe5d0296f5d84ba7510877b216cc40  MesaLib-10.2.7.zip
-</pre>
-
-<h2>New features</h2>
-<p>None</p>
-
-<h2>Bug fixes</h2>
-
-<p>This list is likely incomplete.</p>
-
-<ul>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=36193">Bug 36193</a> - [i965] brw_eu_emit.c:182: validate_reg: Assertion `execsize &gt;= width' failed.</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=66184">Bug 66184</a> - src/mesa/state_tracker/st_glsl_to_tgsi.cpp:3216:simplify_cmp: Assertion `inst-&gt;dst.index &lt; 4096' failed.</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=70441">Bug 70441</a> - [Gen4-5 clip] Piglit spec_OpenGL_1.1_polygon-offset hits (execsize &gt;= width) assertion</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=76188">Bug 76188</a> - EGL_EXT_image_dma_buf_import fd ownership is incorrect</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=76789">Bug 76789</a> - [radeonsi] si_descriptors.c requires -std=gnu99 or -fms-extensions</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=82139">Bug 82139</a> - [r600g, bisected] multiple ubo piglit regressions</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=82255">Bug 82255</a> - [VP2] Chroma planes are vertically stretched during VDPAU playback</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=82671">Bug 82671</a> - [r600g-evergreen][compute]Empty kernel execution causes crash</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=82709">Bug 82709</a> - OpenCL not working on radeon hainan</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=82814">Bug 82814</a> - glDrawBuffers(0, NULL) segfaults in _mesa_drawbuffers</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=83079">Bug 83079</a> - [NVC0] Dota 2 (Linux native and Wine) crash with Nouveau Drivers</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=83355">Bug 83355</a> - FTBFS: src/mesa/program/program_lexer.l:122:64: error: unknown type name 'YYSTYPE'</li>
-
-</ul>
-
-
-<h2>Changes</h2>
-
-<p>Adam Jackson (1):</p>
-<ul>
-  <li>radeonsi: Don't use anonymous struct trick in atom tracking</li>
-</ul>
-
-<p>Alex Deucher (2):</p>
-<ul>
-  <li>radeonsi: add new CIK pci ids</li>
-  <li>radeonsi: add new SI pci ids</li>
-</ul>
-
-<p>Andreas Boll (1):</p>
-<ul>
-  <li>winsys/radeon: fix nop packet padding for hawaii</li>
-</ul>
-
-<p>Anuj Phogat (1):</p>
-<ul>
-  <li>i965: Bail on vec4 copy propagation for scratch writes with source modifiers</li>
-</ul>
-
-<p>Brian Paul (1):</p>
-<ul>
-  <li>mesa: fix NULL pointer deref bug in _mesa_drawbuffers()</li>
-</ul>
-
-<p>Carl Worth (2):</p>
-<ul>
-  <li>docs: Add sha256 sums for the 10.2.6 release</li>
-  <li>Makefile: Switch from md5sums to sha256sums</li>
-</ul>
-
-<p>Dave Airlie (1):</p>
-<ul>
-  <li>i965: add missing parens in vec4 visitor</li>
-</ul>
-
-<p>Emil Velikov (17):</p>
-<ul>
-  <li>configure.ac: bail out if building gallium_gbm without gallium_egl</li>
-  <li>android: gallium/nouveau: fix include folders, link against libstlport</li>
-  <li>android: egl/main: fixup the nouveau build</li>
-  <li>automake: gallium/freedreno: drop spurious include dirs</li>
-  <li>android: gallium/freedreno: add preliminary build</li>
-  <li>android: egl/main: add/enable freedreno</li>
-  <li>android: gallium/auxiliary: drop log2/log2f redefitions</li>
-  <li>android: drop HAL_PIXEL_FORMAT_RGBA_{5551,4444}</li>
-  <li>android: glsl: the stlport over the limited Android STL</li>
-  <li>android: dri/i915: do not build an 'empty' driver</li>
-  <li>cherry-ignore: remove patch that lacking previous dependencies</li>
-  <li>cherry-ignore: PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE is not it 10.2</li>
-  <li>cherry-ignore: drop whitespace fix</li>
-  <li>cherry-ignore: reject a15088338eb</li>
-  <li>get-pick-list.sh: Require explicit "10.2" for nominating stable patches</li>
-  <li>mesa: fix make tarballs</li>
-  <li>Update VERSION to 10.2.7</li>
-</ul>
-
-<p>Ian Romanick (1):</p>
-<ul>
-  <li>mesa: Handle uninitialized textures like other textures in get_tex_level_parameter_image</li>
-</ul>
-
-<p>Ilia Mirkin (9):</p>
-<ul>
-  <li>nouveau: make sure to invalidate any vbo state as well</li>
-  <li>nouveau: don't keep stale pointer to free'd data</li>
-  <li>nvc0/ir: avoid infinite recursion when finding first uses of tex</li>
-  <li>nv50: zero out unbound samplers</li>
-  <li>nvc0: don't make 1d staging textures linear</li>
-  <li>nv50/ir: avoid creating instructions that can't be emitted</li>
-  <li>nv50: set the miptree address when clearing bo's in vp2 init</li>
-  <li>nv50: mt address may not be the underlying bo's start address</li>
-  <li>nv50: attach the buffer bo to the miptree structures</li>
-</ul>
-
-<p>Jan Vesely (1):</p>
-<ul>
-  <li>gallivm: Fix build with latest LLVM</li>
-</ul>
-
-<p>José Fonseca (1):</p>
-<ul>
-  <li>mesa: Move declaration to top of block.</li>
-</ul>
-
-<p>Kenneth Graunke (3):</p>
-<ul>
-  <li>i965/vec4: Set NoMask for GS_OPCODE_SET_VERTEX_COUNT on Gen8+.</li>
-  <li>i965/vec4: Respect ir-&gt;force_writemask_all in Gen8 code generation.</li>
-  <li>i965/clip: Fix brw_clip_unfilled.c/compute_offset's assembly.</li>
-</ul>
-
-<p>Marek Olšák (3):</p>
-<ul>
-  <li>r600g: fix constant buffer fetches</li>
-  <li>radeonsi: save scissor state and sample mask for u_blitter</li>
-  <li>glsl_to_tgsi: allocate and enlarge arrays for temporaries on demand</li>
-</ul>
-
-<p>Paulo Sergio Travaglia (2):</p>
-<ul>
-  <li>android: gallium/radeon: attempt to fix the android build</li>
-  <li>android: egl/main: resolve radeon linking issues</li>
-</ul>
-
-<p>Pekka Paalanen (1):</p>
-<ul>
-  <li>egl_dri2: fix EXT_image_dma_buf_import fds</li>
-</ul>
-
-<p>Robert Bragg (1):</p>
-<ul>
-  <li>meta: save and restore swizzle for _GenerateMipmap</li>
-</ul>
-
-<p>Tom Stellard (7):</p>
-<ul>
-  <li>radeon/compute: Fix reported values for MAX_GLOBAL_SIZE and MAX_MEM_ALLOC_SIZE</li>
-  <li>radeonsi/compute: Update reference counts for buffers in si_set_global_binding()</li>
-  <li>radeonsi/compute: Call si_pm4_free_state() after emitting compute state</li>
-  <li>clover: Flush the command queue in clReleaseCommandQueue()</li>
-  <li>radeon: Add work-around for missing Hainan support in clang &lt; 3.6 v2</li>
-  <li>pipe-loader: Fix memory leak v2</li>
-  <li>r600g/compute: Don't initialize vertex_buffer_state masks to 0x2</li>
-</ul>
-
-<p>Vinson Lee (1):</p>
-<ul>
-  <li>gallivm: Fix build with LLVM &gt;= 3.6 r215967.</li>
-</ul>
-
-
-</div>
-</body>
-</html>
--- a/docs/relnotes/10.2.8.html
+++ b/docs/relnotes/10.2.8.html
@@ -1,128 +0,0 @@
-<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
-<html lang="en">
-<head>
-  <meta http-equiv="content-type" content="text/html; charset=utf-8">
-  <title>Mesa Release Notes</title>
-  <link rel="stylesheet" type="text/css" href="../mesa.css">
-</head>
-<body>
-
-<div class="header">
-  <h1>The Mesa 3D Graphics Library</h1>
-</div>
-
-<iframe src="../contents.html"></iframe>
-<div class="content">
-
-<h1>Mesa 10.2.8 Release Notes / September 19, 2014</h1>
-
-<p>
-Mesa 10.2.8 is a bug fix release which fixes bugs found since the 10.2.7 release.
-</p>
-<p>
-Mesa 10.2.8 implements the OpenGL 3.3 API, but the version reported by
-glGetString(GL_VERSION) or glGetIntegerv(GL_MAJOR_VERSION) /
-glGetIntegerv(GL_MINOR_VERSION) depends on the particular driver being used.
-Some drivers don't support all the features required in OpenGL 3.3.  OpenGL
-3.3 is <strong>only</strong> available if requested at context creation
-because compatibility contexts are not supported.
-</p>
-
-<h2>SHA256 checksums</h2>
-<pre>
-TBD
-</pre>
-
-<h2>New features</h2>
-<p>None</p>
-
-<h2>Bug fixes</h2>
-
-<p>This list is likely incomplete.</p>
-
-<ul>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=77493">Bug 77493</a> - lp_test_arit fails with llvm &gt;= llvm-3.5svn r206094</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=82539">Bug 82539</a> - vmw_screen_dri.lo In file included from vmw_screen_dri.c:41: vmwgfx_drm.h:32:17: error: drm.h: No such file or directory</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=82882">Bug 82882</a> - [swrast] piglit glsl-fs-uniform-bool-1 regression</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=83432">Bug 83432</a> - r600_query.c:269:r600_emit_query_end: Assertion `ctx-&gt;num_pipelinestat_queries &gt; 0' failed [Gallium HUD]</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=83567">Bug 83567</a> - Mesa 10.2.6 does not compile with llvm 3.5</li>
-
-<li><a href="https://bugs.freedesktop.org/show_bug.cgi?id=83735">Bug 83735</a> - [mesa-10.2.x] broken with llvm-3.5 and old CPUs</li>
-
-</ul>
-
-<h2>Changes</h2>
-<p>Aaron Watry (1):</p>
-<ul>
-  <li>gallivm: Fix build after LLVM commit 211259</li>
-</ul>
-
-<p>Christoph Bumiller (2):</p>
-<ul>
-  <li>nv50/ir/util: fix BitSet issues</li>
-  <li>nvc0/ir: clarify recursion fix to finding first tex uses</li>
-</ul>
-
-<p>Emil Velikov (3):</p>
-<ul>
-  <li>docs: Add sha256 sums for the 10.2.7 release</li>
-  <li>configure: bail out if building svga without libdrm</li>
-  <li>Update VERSION to 10.2.8</li>
-</ul>
-
-<p>Ilia Mirkin (4):</p>
-<ul>
-  <li>nv50/ir: avoid array overrun when checking for supported mods</li>
-  <li>nouveau: only enable the depth test if there actually is a depth buffer</li>
-  <li>nouveau: only enable stencil func if the visual has stencil bits</li>
-  <li>nouveau: change internal variables to avoid conflicts with macro args</li>
-</ul>
-
-<p>Jonathan Gray (1):</p>
-<ul>
-  <li>configure.ac: strip _GNU_SOURCE from llvm-config output</li>
-</ul>
-
-<p>José Fonseca (1):</p>
-<ul>
-  <li>gallivm: Disable workaround for PR12833 on LLVM 3.2+.</li>
-</ul>
-
-<p>Maarten Lankhorst (4):</p>
-<ul>
-  <li>nouveau: re-allocate bo's on overflow</li>
-  <li>nouveau: fix MPEG4 hw decoding</li>
-  <li>nouveau: rework reference frame handling</li>
-  <li>nouveau: remove unneeded assert</li>
-</ul>
-
-<p>Marek Olšák (3):</p>
-<ul>
-  <li>r600g,radeonsi: make sure there's enough CS space before resuming queries</li>
-  <li>mesa: set UniformBooleanTrue = 1.0f by default</li>
-  <li>st/mesa: use 1.0f as boolean true on drivers without integer support</li>
-</ul>
-
-<p>Richard Sandiford (1):</p>
-<ul>
-  <li>gallivm: Fix uses of 2^24</li>
-</ul>
-
-<p>Roland Scheidegger (1):</p>
-<ul>
-  <li>gallivm: set mcpu when initializing llvm execution engine</li>
-</ul>
-
-<p>Thomas Hellstrom (1):</p>
-<ul>
-  <li>winsys/svga: Fix incorrect type usage in IOCTL v2</li>
-</ul>
-
-</div>
-</body>
-</html>
--- a/docs/relnotes/10.2.html
+++ b/docs/relnotes/10.2.html
@@ -14,7 +14,7 @@
 <iframe src="../contents.html"></iframe>
 <div class="content">

-<h1>Mesa 10.2 Release Notes / June 6, 2014</h1>
+<h1>Mesa 10.2 Release Notes / TBD</h1>

 <p>
 Mesa 10.2 is a new development release.
@@ -33,9 +33,7 @@ because compatibility contexts are not supported.

 <h2>MD5 checksums</h2>
 <pre>
-c87bfb6dd5cbcf1fdef42e5ccd972581  MesaLib-10.2.0.tar.gz
-7aaba90bd7169a94ae2fe83febdec963  MesaLib-10.2.0.tar.bz2
-58b203aca15dadc25ab4d1126db1052b  MesaLib-10.2.0.zip
+TBD.
 </pre>


@@ -69,25 +67,6 @@ TBD.
 <h2>Changes</h2>

 <ul>
-<li>Renamed <i>--with-llvm-shared-libs</i> to <i>--enable-llvm-shared-libs</i></li>
-<p>
-The option is used to control how mesa is linked against LLVM, and now
-defaults to enabled (shared linking).
-</p>
-
-<li>Split <i>libxatracker.so</i> into a standalone library which can be used
-with any gallium driver.</li>
-<p>
-Previously the library was linked statically against vmware's virtual gpu
-driver(svga), whereas now it loads a shared pipe_*.so driver. Provide the
-following options during configure, if you would like support for svga driver
-<i>--enable-xa --with-gallium-drivers=svga</i>
-</p>
-
-<p>
-Note: The files are installed in $(libdir)/gallium-pipe/ and the interface
-between them and libxatracker.so is <strong>not</strong> stable.
-</p>
 </ul>

 </div>
--- a/include/GL/glx.h
+++ b/include/GL/glx.h
@@ -518,7 +518,7 @@ typedef struct {
    unsigned long serial;	/* # of last request processed by server */
    Bool send_event;		/* true if this came from a SendEvent request */
    Display *display;		/* Display the event was read from */
-    Drawable drawable;	/* drawable on which event was requested in event mask */
+    GLXDrawable drawable;	/* drawable on which event was requested in event mask */
    int event_type;
    int64_t ust;
    int64_t msc;
--- a/include/pci_ids/i965_pci_ids.h
+++ b/include/pci_ids/i965_pci_ids.h
@@ -91,24 +91,24 @@ CHIPSET(0x0F32, byt,     "Intel(R) Bay Trail")
 CHIPSET(0x0F33, byt,     "Intel(R) Bay Trail")
 CHIPSET(0x0157, byt,     "Intel(R) Bay Trail")
 CHIPSET(0x0155, byt,     "Intel(R) Bay Trail")
-CHIPSET(0x1602, bdw_gt1, "Intel(R) Broadwell GT1")
-CHIPSET(0x1606, bdw_gt1, "Intel(R) Broadwell GT1")
-CHIPSET(0x160A, bdw_gt1, "Intel(R) Broadwell GT1")
-CHIPSET(0x160B, bdw_gt1, "Intel(R) Broadwell GT1")
-CHIPSET(0x160D, bdw_gt1, "Intel(R) Broadwell GT1")
-CHIPSET(0x160E, bdw_gt1, "Intel(R) Broadwell GT1")
-CHIPSET(0x1612, bdw_gt2, "Intel(R) HD Graphics 5600 (Broadwell GT2)")
-CHIPSET(0x1616, bdw_gt2, "Intel(R) HD Graphics 5500 (Broadwell GT2)")
-CHIPSET(0x161A, bdw_gt2, "Intel(R) Broadwell GT2")
-CHIPSET(0x161B, bdw_gt2, "Intel(R) Broadwell GT2")
-CHIPSET(0x161D, bdw_gt2, "Intel(R) Broadwell GT2")
-CHIPSET(0x161E, bdw_gt2, "Intel(R) HD Graphics 5300 (Broadwell GT2)")
-CHIPSET(0x1622, bdw_gt3, "Intel(R) Iris Pro 6200 (Broadwell GT3e)")
-CHIPSET(0x1626, bdw_gt3, "Intel(R) HD Graphics 6000 (Broadwell GT3)")
-CHIPSET(0x162A, bdw_gt3, "Intel(R) Iris Pro P6300 (Broadwell GT3e)")
-CHIPSET(0x162B, bdw_gt3, "Intel(R) Iris 6100 (Broadwell GT3)")
-CHIPSET(0x162D, bdw_gt3, "Intel(R) Broadwell GT3")
-CHIPSET(0x162E, bdw_gt3, "Intel(R) Broadwell GT3")
+CHIPSET(0x1602, bdw_gt1, "Intel(R) Broadwell")
+CHIPSET(0x1606, bdw_gt1, "Intel(R) Broadwell")
+CHIPSET(0x160A, bdw_gt1, "Intel(R) Broadwell")
+CHIPSET(0x160B, bdw_gt1, "Intel(R) Broadwell")
+CHIPSET(0x160D, bdw_gt1, "Intel(R) Broadwell")
+CHIPSET(0x160E, bdw_gt1, "Intel(R) Broadwell")
+CHIPSET(0x1612, bdw_gt2, "Intel(R) Broadwell")
+CHIPSET(0x1616, bdw_gt2, "Intel(R) Broadwell")
+CHIPSET(0x161A, bdw_gt2, "Intel(R) Broadwell")
+CHIPSET(0x161B, bdw_gt2, "Intel(R) Broadwell")
+CHIPSET(0x161D, bdw_gt2, "Intel(R) Broadwell")
+CHIPSET(0x161E, bdw_gt2, "Intel(R) Broadwell")
+CHIPSET(0x1622, bdw_gt3, "Intel(R) Broadwell")
+CHIPSET(0x1626, bdw_gt3, "Intel(R) Broadwell")
+CHIPSET(0x162A, bdw_gt3, "Intel(R) Broadwell")
+CHIPSET(0x162B, bdw_gt3, "Intel(R) Broadwell")
+CHIPSET(0x162D, bdw_gt3, "Intel(R) Broadwell")
+CHIPSET(0x162E, bdw_gt3, "Intel(R) Broadwell")
 CHIPSET(0x22B0, chv,     "Intel(R) Cherryview")
 CHIPSET(0x22B1, chv,     "Intel(R) Cherryview")
 CHIPSET(0x22B2, chv,     "Intel(R) Cherryview")
--- a/include/pci_ids/radeonsi_pci_ids.h
+++ b/include/pci_ids/radeonsi_pci_ids.h
@@ -38,7 +38,6 @@ CHIPSET(0x6828, VERDE_6828, VERDE)
 CHIPSET(0x6829, VERDE_6829, VERDE)
 CHIPSET(0x682A, VERDE_682A, VERDE)
 CHIPSET(0x682B, VERDE_682B, VERDE)
-CHIPSET(0x682C, VERDE_682C, VERDE)
 CHIPSET(0x682D, VERDE_682D, VERDE)
 CHIPSET(0x682F, VERDE_682F, VERDE)
 CHIPSET(0x6830, VERDE_6830, VERDE)
@@ -55,11 +54,8 @@ CHIPSET(0x6600, OLAND_6600, OLAND)
 CHIPSET(0x6601, OLAND_6601, OLAND)
 CHIPSET(0x6602, OLAND_6602, OLAND)
 CHIPSET(0x6603, OLAND_6603, OLAND)
-CHIPSET(0x6604, OLAND_6604, OLAND)
-CHIPSET(0x6605, OLAND_6605, OLAND)
 CHIPSET(0x6606, OLAND_6606, OLAND)
 CHIPSET(0x6607, OLAND_6607, OLAND)
-CHIPSET(0x6608, OLAND_6608, OLAND)
 CHIPSET(0x6610, OLAND_6610, OLAND)
 CHIPSET(0x6611, OLAND_6611, OLAND)
 CHIPSET(0x6613, OLAND_6613, OLAND)
@@ -77,8 +73,6 @@ CHIPSET(0x666F, HAINAN_666F, HAINAN)

 CHIPSET(0x6640, BONAIRE_6640, BONAIRE)
 CHIPSET(0x6641, BONAIRE_6641, BONAIRE)
-CHIPSET(0x6646, BONAIRE_6646, BONAIRE)
-CHIPSET(0x6647, BONAIRE_6647, BONAIRE)
 CHIPSET(0x6649, BONAIRE_6649, BONAIRE)
 CHIPSET(0x6650, BONAIRE_6650, BONAIRE)
 CHIPSET(0x6651, BONAIRE_6651, BONAIRE)
@@ -138,7 +132,6 @@ CHIPSET(0x1313, KAVERI_1313, KAVERI)
 CHIPSET(0x1315, KAVERI_1315, KAVERI)
 CHIPSET(0x1316, KAVERI_1316, KAVERI)
 CHIPSET(0x1317, KAVERI_1317, KAVERI)
-CHIPSET(0x1318, KAVERI_1318, KAVERI)
 CHIPSET(0x131B, KAVERI_131B, KAVERI)
 CHIPSET(0x131C, KAVERI_131C, KAVERI)
 CHIPSET(0x131D, KAVERI_131D, KAVERI)
--- a/src/egl/drivers/dri2/Android.mk
+++ b/src/egl/drivers/dri2/Android.mk
@@ -40,12 +40,8 @@ LOCAL_C_INCLUDES := \
 	$(MESA_TOP)/src/mapi \
 	$(MESA_TOP)/src/egl/main \
 	$(MESA_TOP)/src/loader \
-	$(DRM_TOP)/include/drm \
 	$(DRM_GRALLOC_TOP)

-LOCAL_STATIC_LIBRARIES := \
-	libloader
-
 LOCAL_MODULE := libmesa_egl_dri2

 include $(MESA_COMMON_MK)
--- a/src/egl/drivers/dri2/egl_dri2.c
+++ b/src/egl/drivers/dri2/egl_dri2.c
@@ -1663,13 +1663,36 @@ dri2_check_dma_buf_format(const _EGLImageAttribs *attrs)
 /**
 * The spec says:
 *
- * "If eglCreateImageKHR is successful for a EGL_LINUX_DMA_BUF_EXT target, the
- *  EGL will take a reference to the dma_buf(s) which it will release at any
- *  time while the EGLDisplay is initialized. It is the responsibility of the
- *  application to close the dma_buf file descriptors."
- *
- * Therefore we must never close or otherwise modify the file descriptors.
+ * "If eglCreateImageKHR is successful for a EGL_LINUX_DMA_BUF_EXT target,
+ *  the EGL takes ownership of the file descriptor and is responsible for
+ *  closing it, which it may do at any time while the EGLDisplay is
+ *  initialized."
 */
+static void
+dri2_take_dma_buf_ownership(const int *fds, unsigned num_fds)
+{
+   int already_closed[num_fds];
+   unsigned num_closed = 0;
+   unsigned i, j;
+
+   for (i = 0; i < num_fds; ++i) {
+      /**
+       * The same file descriptor can be referenced multiple times in case more
+       * than one plane is found in the same buffer, just with a different
+       * offset.
+       */
+      for (j = 0; j < num_closed; ++j) {
+         if (already_closed[j] == fds[i])
+            break;
+      }
+
+      if (j == num_closed) {
+         close(fds[i]);
+         already_closed[num_closed++] = fds[i];
+      }
+   }
+}
+
 static _EGLImage *
 dri2_create_image_dma_buf(_EGLDisplay *disp, _EGLContext *ctx,
 			  EGLClientBuffer buffer, const EGLint *attr_list)
@@ -1732,6 +1755,8 @@ dri2_create_image_dma_buf(_EGLDisplay *disp, _EGLContext *ctx,
      return EGL_NO_IMAGE_KHR;

   res = dri2_create_image_from_dri(disp, dri_image);
+   if (res)
+      dri2_take_dma_buf_ownership(fds, num_fds);

   return res;
 }
--- a/src/egl/drivers/dri2/platform_android.c
+++ b/src/egl/drivers/dri2/platform_android.c
@@ -54,6 +54,8 @@ get_format_bpp(int native)
      bpp = 3;
      break;
   case HAL_PIXEL_FORMAT_RGB_565:
+   case HAL_PIXEL_FORMAT_RGBA_5551:
+   case HAL_PIXEL_FORMAT_RGBA_4444:
      bpp = 2;
      break;
   default:
@@ -369,6 +371,8 @@ dri2_create_image_android_native_buffer(_EGLDisplay *disp, _EGLContext *ctx,
      format = __DRI_IMAGE_FORMAT_XBGR8888;
      break;
   case HAL_PIXEL_FORMAT_RGB_888:
+   case HAL_PIXEL_FORMAT_RGBA_5551:
+   case HAL_PIXEL_FORMAT_RGBA_4444:
      /* unsupported */
   default:
      _eglLog(_EGL_WARNING, "unsupported native buffer format 0x%x", buf->format);
@@ -634,7 +638,7 @@ droid_log(EGLint level, const char *msg)
 static struct dri2_egl_display_vtbl droid_display_vtbl = {
   .authenticate = NULL,
   .create_window_surface = droid_create_window_surface,
-   .create_pixmap_surface = dri2_fallback_create_pixmap_surface,
+   .create_pixmap_surface = dri2_fallback_pixmap_surface,
   .create_pbuffer_surface = droid_create_pbuffer_surface,
   .destroy_surface = droid_destroy_surface,
   .create_image = droid_create_image_khr,
--- a/src/egl/main/Android.mk
+++ b/src/egl/main/Android.mk
@@ -95,12 +95,6 @@ gallium_DRIVERS :=
 # swrast
 gallium_DRIVERS += libmesa_pipe_softpipe libmesa_winsys_sw_android

-# freedreno
-ifneq ($(filter freedreno, $(MESA_GPU_DRIVERS)),)
-gallium_DRIVERS += libmesa_winsys_freedreno libmesa_pipe_freedreno
-LOCAL_SHARED_LIBRARIES += libdrm_freedreno
-endif
-
 # i915g
 ifneq ($(filter i915g, $(MESA_GPU_DRIVERS)),)
 gallium_DRIVERS += libmesa_winsys_i915 libmesa_pipe_i915
@@ -115,29 +109,28 @@ endif

 # nouveau
 ifneq ($(filter nouveau, $(MESA_GPU_DRIVERS)),)
-gallium_DRIVERS +=  libmesa_winsys_nouveau libmesa_pipe_nouveau
+gallium_DRIVERS += \
+	libmesa_winsys_nouveau \
+	libmesa_pipe_nvfx \
+	libmesa_pipe_nv50 \
+	libmesa_pipe_nvc0 \
+	libmesa_pipe_nouveau
 LOCAL_SHARED_LIBRARIES += libdrm_nouveau
-LOCAL_SHARED_LIBRARIES += libstlport
 endif

 # r300g/r600g/radeonsi
 ifneq ($(filter r300g r600g radeonsi, $(MESA_GPU_DRIVERS)),)
 gallium_DRIVERS += libmesa_winsys_radeon
-LOCAL_SHARED_LIBRARIES += libdrm_radeon
 ifneq ($(filter r300g, $(MESA_GPU_DRIVERS)),)
 gallium_DRIVERS += libmesa_pipe_r300
-endif # r300g
-ifneq ($(filter r600g radeonsi, $(MESA_GPU_DRIVERS)),)
+endif
 ifneq ($(filter r600g, $(MESA_GPU_DRIVERS)),)
 gallium_DRIVERS += libmesa_pipe_r600
-LOCAL_SHARED_LIBRARIES += libstlport
-endif # r600g
+endif
 ifneq ($(filter radeonsi, $(MESA_GPU_DRIVERS)),)
 gallium_DRIVERS += libmesa_pipe_radeonsi
-endif # radeonsi
-gallium_DRIVERS += libmesa_pipe_radeon
-endif # r600g || radeonsi
-endif # r300g || r600g || radeonsi
+endif
+endif

 # vmwgfx
 ifneq ($(filter vmwgfx, $(MESA_GPU_DRIVERS)),)
@@ -161,14 +154,11 @@ LOCAL_STATIC_LIBRARIES := \
 	libmesa_glsl \
 	libmesa_glsl_utils \
 	libmesa_gallium \
+	libloader \
 	$(LOCAL_STATIC_LIBRARIES)

 endif # MESA_BUILD_GALLIUM

-LOCAL_STATIC_LIBRARIES := \
-	$(LOCAL_STATIC_LIBRARIES) \
-	libloader
-
 LOCAL_MODULE := libGLES_mesa
 LOCAL_MODULE_PATH := $(TARGET_OUT_SHARED_LIBRARIES)/egl

--- a/src/egl/main/eglapi.c
+++ b/src/egl/main/eglapi.c
@@ -524,12 +524,8 @@ eglMakeCurrent(EGLDisplay dpy, EGLSurface draw, EGLSurface read,
   if (!context && ctx != EGL_NO_CONTEXT)
      RETURN_EGL_ERROR(disp, EGL_BAD_CONTEXT, EGL_FALSE);
   if (!draw_surf || !read_surf) {
-      /* From the EGL 1.4 (20130211) spec:
-       *
-       *    To release the current context without assigning a new one, set ctx
-       *    to EGL_NO_CONTEXT and set draw and read to EGL_NO_SURFACE.
-       */
-      if (!disp->Extensions.KHR_surfaceless_context && ctx != EGL_NO_CONTEXT)
+      /* surfaces may be NULL if surfaceless */
+      if (!disp->Extensions.KHR_surfaceless_context)
         RETURN_EGL_ERROR(disp, EGL_BAD_SURFACE, EGL_FALSE);

      if ((!draw_surf && draw != EGL_NO_SURFACE) ||
@@ -571,10 +567,6 @@ _eglCreateWindowSurfaceCommon(_EGLDisplay *disp, EGLConfig config,
   EGLSurface ret;

   _EGL_CHECK_CONFIG(disp, conf, EGL_NO_SURFACE, drv);
-
-   if (native_window == NULL)
-      RETURN_EGL_ERROR(disp, EGL_BAD_NATIVE_WINDOW, EGL_NO_SURFACE);
-
   surf = drv->API.CreateWindowSurface(drv, disp, conf, native_window,
                                       attrib_list);
   ret = (surf) ? _eglLinkSurface(surf) : EGL_NO_SURFACE;
--- a/src/egl/main/eglcontext.c
+++ b/src/egl/main/eglcontext.c
@@ -322,14 +322,11 @@ _eglParseContextAttribList(_EGLContext *ctx, _EGLDisplay *dpy,
         break;

      case 3:
+      default:
         /* Don't put additional version checks here.  We don't know that
          * there won't be versions > 3.0.
          */
         break;
-
-      default:
-         err = EGL_BAD_MATCH;
-         break;
      }
   }

--- a/src/egl/wayland/wayland-drm/wayland-drm.xml
+++ b/src/egl/wayland/wayland-drm/wayland-drm.xml
@@ -135,6 +135,22 @@
      <arg name="stride2" type="int"/>
    </request>

+    <!-- Create a wayland buffer for the prime fd.  Use for regular and planar
+         buffers.  Pass 0 for offset and stride for unused planes. -->
+    <request name="create_prime_buffer" since="2">
+      <arg name="id" type="new_id" interface="wl_buffer"/>
+      <arg name="name" type="fd"/>
+      <arg name="width" type="int"/>
+      <arg name="height" type="int"/>
+      <arg name="format" type="uint"/>
+      <arg name="offset0" type="int"/>
+      <arg name="stride0" type="int"/>
+      <arg name="offset1" type="int"/>
+      <arg name="stride1" type="int"/>
+      <arg name="offset2" type="int"/>
+      <arg name="stride2" type="int"/>
+    </request>
+
    <!-- Notification of the path of the drm device which is used by
         the server.  The client should use this device for creating
         local buffers.  Only buffers created from this device should
@@ -161,25 +177,6 @@
    <event name="capabilities">
      <arg name="value" type="uint"/>
    </event>
-
-    <!-- Version 2 additions -->
-
-    <!-- Create a wayland buffer for the prime fd.  Use for regular and planar
-         buffers.  Pass 0 for offset and stride for unused planes. -->
-    <request name="create_prime_buffer" since="2">
-      <arg name="id" type="new_id" interface="wl_buffer"/>
-      <arg name="name" type="fd"/>
-      <arg name="width" type="int"/>
-      <arg name="height" type="int"/>
-      <arg name="format" type="uint"/>
-      <arg name="offset0" type="int"/>
-      <arg name="stride0" type="int"/>
-      <arg name="offset1" type="int"/>
-      <arg name="stride1" type="int"/>
-      <arg name="offset2" type="int"/>
-      <arg name="stride2" type="int"/>
-    </request>
-
  </interface>

 </protocol>
--- a/src/gallium/Android.mk
+++ b/src/gallium/Android.mk
@@ -34,11 +34,6 @@ SUBDIRS := \
 # swrast
 SUBDIRS += winsys/sw/android drivers/softpipe

-# freedreno
-ifneq ($(filter freedreno, $(MESA_GPU_DRIVERS)),)
-SUBDIRS += winsys/freedreno/drm drivers/freedreno
-endif
-
 # i915g
 ifneq ($(filter i915g, $(MESA_GPU_DRIVERS)),)
 SUBDIRS += winsys/i915/drm drivers/i915
@@ -62,8 +57,6 @@ SUBDIRS += winsys/radeon/drm
 ifneq ($(filter r300g, $(MESA_GPU_DRIVERS)),)
 SUBDIRS += drivers/r300
 endif
-ifneq ($(filter r600g radeonsi, $(MESA_GPU_DRIVERS)),)
-SUBDIRS += drivers/radeon
 ifneq ($(filter r600g, $(MESA_GPU_DRIVERS)),)
 SUBDIRS += drivers/r600
 endif
@@ -71,7 +64,6 @@ ifneq ($(filter radeonsi, $(MESA_GPU_DRIVERS)),)
 SUBDIRS += drivers/radeonsi
 endif
 endif
-endif

 # vmwgfx
 ifneq ($(filter vmwgfx, $(MESA_GPU_DRIVERS)),)
--- a/src/gallium/auxiliary/draw/draw_private.h
+++ b/src/gallium/auxiliary/draw/draw_private.h
@@ -493,7 +493,7 @@ draw_stats_clipper_primitives(struct draw_context *draw,
 static INLINE unsigned
 draw_clamp_viewport_idx(int idx)
 {
-   return ((PIPE_MAX_VIEWPORTS > idx && idx >= 0) ? idx : 0);
+   return ((PIPE_MAX_VIEWPORTS > idx || idx < 0) ? idx : 0);
 }

 /**
--- a/src/gallium/auxiliary/gallivm/lp_bld_arit.c
+++ b/src/gallium/auxiliary/gallivm/lp_bld_arit.c
@@ -1852,7 +1852,7 @@ lp_build_trunc(struct lp_build_context *bld,
      const struct lp_type type = bld->type;
      struct lp_type inttype;
      struct lp_build_context intbld;
-      LLVMValueRef cmpval = lp_build_const_vec(bld->gallivm, type, 1<<24);
+      LLVMValueRef cmpval = lp_build_const_vec(bld->gallivm, type, 2^24);
      LLVMValueRef trunc, res, anosign, mask;
      LLVMTypeRef int_vec_type = bld->int_vec_type;
      LLVMTypeRef vec_type = bld->vec_type;
@@ -1907,7 +1907,7 @@ lp_build_round(struct lp_build_context *bld,
      const struct lp_type type = bld->type;
      struct lp_type inttype;
      struct lp_build_context intbld;
-      LLVMValueRef cmpval = lp_build_const_vec(bld->gallivm, type, 1<<24);
+      LLVMValueRef cmpval = lp_build_const_vec(bld->gallivm, type, 2^24);
      LLVMValueRef res, anosign, mask;
      LLVMTypeRef int_vec_type = bld->int_vec_type;
      LLVMTypeRef vec_type = bld->vec_type;
@@ -1960,7 +1960,7 @@ lp_build_floor(struct lp_build_context *bld,
      const struct lp_type type = bld->type;
      struct lp_type inttype;
      struct lp_build_context intbld;
-      LLVMValueRef cmpval = lp_build_const_vec(bld->gallivm, type, 1<<24);
+      LLVMValueRef cmpval = lp_build_const_vec(bld->gallivm, type, 2^24);
      LLVMValueRef trunc, res, anosign, mask;
      LLVMTypeRef int_vec_type = bld->int_vec_type;
      LLVMTypeRef vec_type = bld->vec_type;
@@ -2029,7 +2029,7 @@ lp_build_ceil(struct lp_build_context *bld,
      const struct lp_type type = bld->type;
      struct lp_type inttype;
      struct lp_build_context intbld;
-      LLVMValueRef cmpval = lp_build_const_vec(bld->gallivm, type, 1<<24);
+      LLVMValueRef cmpval = lp_build_const_vec(bld->gallivm, type, 2^24);
      LLVMValueRef trunc, res, anosign, mask, tmp;
      LLVMTypeRef int_vec_type = bld->int_vec_type;
      LLVMTypeRef vec_type = bld->vec_type;
--- a/src/gallium/auxiliary/gallivm/lp_bld_debug.cpp
+++ b/src/gallium/auxiliary/gallivm/lp_bld_debug.cpp
@@ -34,10 +34,6 @@
 #include <llvm/Support/Format.h>
 #include <llvm/Support/MemoryObject.h>

-#if HAVE_LLVM >= 0x0306
-#include <llvm/Target/TargetSubtargetInfo.h>
-#endif
-
 #if HAVE_LLVM >= 0x0300
 #include <llvm/Support/TargetRegistry.h>
 #include <llvm/MC/MCSubtargetInfo.h>
@@ -61,9 +57,7 @@
 #include <llvm/MC/MCRegisterInfo.h>
 #endif /* HAVE_LLVM >= 0x0301 */

-#if HAVE_LLVM >= 0x0305
-#define OwningPtr std::unique_ptr
-#elif HAVE_LLVM >= 0x0303
+#if HAVE_LLVM >= 0x0303
 #include <llvm/ADT/OwningPtr.h>
 #endif

@@ -308,11 +302,7 @@ disassemble(const void* func, llvm::raw_ostream & Out)
   OwningPtr<TargetMachine> TM(T->createTargetMachine(Triple, ""));
 #endif

-#if HAVE_LLVM >= 0x0306
-   const TargetInstrInfo *TII = TM->getSubtargetImpl()->getInstrInfo();
-#else
   const TargetInstrInfo *TII = TM->getInstrInfo();
-#endif

   /*
    * Wrap the data in a MemoryObject
--- a/src/gallium/auxiliary/gallivm/lp_bld_misc.cpp
+++ b/src/gallium/auxiliary/gallivm/lp_bld_misc.cpp
@@ -73,10 +73,6 @@
 #include <llvm/Support/CBindingWrapping.h>
 #endif

-#if HAVE_LLVM >= 0x0305
-#include <llvm/Support/Host.h>
-#endif
-
 #include "pipe/p_config.h"
 #include "util/u_debug.h"
 #include "util/u_cpu_detect.h"
@@ -270,11 +266,7 @@ lp_build_create_jit_compiler_for_module(LLVMExecutionEngineRef *OutJIT,
   using namespace llvm;

   std::string Error;
-#if HAVE_LLVM >= 0x0306
-   EngineBuilder builder(std::unique_ptr<Module>(unwrap(M)));
-#else
   EngineBuilder builder(unwrap(M));
-#endif

   /**
    * LLVM 3.1+ haven't more "extern unsigned llvm::StackAlignmentOverride" and
@@ -313,8 +305,8 @@ lp_build_create_jit_compiler_for_module(LLVMExecutionEngineRef *OutJIT,
      /*
       * AVX feature is not automatically detected from CPUID by the X86 target
       * yet, because the old (yet default) JIT engine is not capable of
-       * emitting the opcodes. On newer llvm versions it is and at least some
-       * versions (tested with 3.3) will emit avx opcodes without this anyway.
+       * emitting the opcodes.  But as we're using MCJIT here, it is safe to
+       * add set this attribute.
       */
      MAttrs.push_back("+avx");
      if (util_cpu_caps.has_f16c) {
@@ -324,30 +316,12 @@ lp_build_create_jit_compiler_for_module(LLVMExecutionEngineRef *OutJIT,
   }
   builder.setJITMemoryManager(JITMemoryManager::CreateDefaultMemManager());

-#if HAVE_LLVM >= 0x0305
-   StringRef MCPU = llvm::sys::getHostCPUName();
-   /*
-    * The cpu bits are no longer set automatically, so need to set mcpu manually.
-    * Note that the MAttrs set above will be sort of ignored (since we should
-    * not set any which would not be set by specifying the cpu anyway).
-    * It ought to be safe though since getHostCPUName() should include bits
-    * not only from the cpu but environment as well (for instance if it's safe
-    * to use avx instructions which need OS support). According to
-    * http://llvm.org/bugs/show_bug.cgi?id=19429 however if I understand this
-    * right it may be necessary to specify older cpu (or disable mattrs) though
-    * when not using MCJIT so no instructions are generated which the old JIT
-    * can't handle. Not entirely sure if we really need to do anything yet.
-    */
-   builder.setMCPU(MCPU);
-#endif
-
   ExecutionEngine *JIT;
-
-#if HAVE_LLVM >= 0x0302
+#if 0
   JIT = builder.create();
 #else
   /*
-    * Workaround http://llvm.org/PR12833
+    * Workaround http://llvm.org/bugs/show_bug.cgi?id=12833
    */
   StringRef MArch = "";
   StringRef MCPU = "";
--- a/src/gallium/auxiliary/gallivm/lp_bld_sample.c
+++ b/src/gallium/auxiliary/gallivm/lp_bld_sample.c
@@ -927,7 +927,6 @@ lp_build_nearest_mip_level(struct lp_build_sample_context *bld,
                                                                bld->int_coord_bld.type,
                                                                out);
      }
-      level = lp_build_andnot(&bld->int_coord_bld, level, *out_of_bounds);
      *level_out = level;
   }
   else {
--- a/src/gallium/auxiliary/pipe-loader/pipe_loader.h
+++ b/src/gallium/auxiliary/pipe-loader/pipe_loader.h
@@ -66,7 +66,7 @@ struct pipe_loader_device {
      } pci;
   } u; /**< Discriminated by \a type */

-   char *driver_name;
+   const char *driver_name;
   const struct pipe_loader_ops *ops;
 };

--- a/src/gallium/auxiliary/pipe-loader/pipe_loader_drm.c
+++ b/src/gallium/auxiliary/pipe-loader/pipe_loader_drm.c
@@ -256,7 +256,6 @@ pipe_loader_drm_release(struct pipe_loader_device **dev)
      util_dl_close(ddev->lib);

   close(ddev->fd);
-   FREE(ddev->base.driver_name);
   FREE(ddev);
   *dev = NULL;
 }
--- a/src/gallium/auxiliary/tgsi/tgsi_strings.c
+++ b/src/gallium/auxiliary/tgsi/tgsi_strings.c
@@ -120,8 +120,7 @@ const char *tgsi_property_names[TGSI_PROPERTY_COUNT] =
   "FS_COORD_PIXEL_CENTER",
   "FS_COLOR0_WRITES_ALL_CBUFS",
   "FS_DEPTH_LAYOUT",
-   "VS_PROHIBIT_UCPS",
-   "GS_INVOCATIONS",
+   "VS_PROHIBIT_UCPS"
 };

 const char *tgsi_type_names[5] =
--- a/src/gallium/auxiliary/util/u_blitter.c
+++ b/src/gallium/auxiliary/util/u_blitter.c
@@ -383,15 +383,6 @@ void util_blitter_destroy(struct blitter_context *blitter)
      if (ctx->fs_texfetch_stencil[i])
         ctx->delete_fs_state(pipe, ctx->fs_texfetch_stencil[i]);

-      if (ctx->fs_texfetch_col_msaa[i])
-         ctx->delete_fs_state(pipe, ctx->fs_texfetch_col_msaa[i]);
-      if (ctx->fs_texfetch_depth_msaa[i])
-         ctx->delete_fs_state(pipe, ctx->fs_texfetch_depth_msaa[i]);
-      if (ctx->fs_texfetch_depthstencil_msaa[i])
-         ctx->delete_fs_state(pipe, ctx->fs_texfetch_depthstencil_msaa[i]);
-      if (ctx->fs_texfetch_stencil_msaa[i])
-         ctx->delete_fs_state(pipe, ctx->fs_texfetch_stencil_msaa[i]);
-
      for (j = 0; j< Elements(ctx->fs_resolve[i]); j++)
         for (f = 0; f < 2; f++)
            if (ctx->fs_resolve[i][j][f])
--- a/src/gallium/auxiliary/util/u_math.h
+++ b/src/gallium/auxiliary/util/u_math.h
@@ -149,6 +149,28 @@ roundf(float x)
 #endif /* _MSC_VER */


+#ifdef PIPE_OS_ANDROID
+
+static INLINE
+double log2(double d)
+{
+   return log(d) * (1.0 / M_LN2);
+}
+
+/* workaround a conflict with main/imports.h */
+#ifdef log2f
+#undef log2f
+#endif
+
+static INLINE
+float log2f(float f)
+{
+   return logf(f) * (float) (1.0 / M_LN2);
+}
+
+#endif
+
+
 #if __STDC_VERSION__ < 199901L && (!defined(__cplusplus) || defined(_MSC_VER))
 static INLINE long int
 lrint(double d)
--- a/src/gallium/auxiliary/util/u_prim.h
+++ b/src/gallium/auxiliary/util/u_prim.h
@@ -136,21 +136,6 @@ u_prim_vertex_count(unsigned prim)
   return (likely(prim < PIPE_PRIM_MAX)) ? &prim_table[prim] : NULL;
 }

-/**
- * Given a vertex count, return the number of primitives.
- * For polygons, return the number of triangles.
- */
-static INLINE unsigned
-u_prims_for_vertices(unsigned prim, unsigned num)
-{
-   const struct u_prim_vertex_count *info = u_prim_vertex_count(prim);
-
-   if (num < info->min)
-      return 0;
-
-   return 1 + ((num - info->min) / info->incr);
-}
-
 static INLINE boolean u_validate_pipe_prim( unsigned pipe_prim, unsigned nr )
 {
   const struct u_prim_vertex_count *count = u_prim_vertex_count(pipe_prim);
--- a/src/gallium/auxiliary/util/u_transfer.c
+++ b/src/gallium/auxiliary/util/u_transfer.c
@@ -25,8 +25,8 @@ void u_default_transfer_inline_write( struct pipe_context *pipe,
   usage |= PIPE_TRANSFER_WRITE;

   /* transfer_inline_write implicitly discards the rewritten buffer range */
-   if (resource->target == PIPE_BUFFER &&
-       box->x == 0 && box->width == resource->width0) {
+   /* XXX this looks very broken for non-buffer resources having more than one dim. */
+   if (box->x == 0 && box->width == resource->width0) {
      usage |= PIPE_TRANSFER_DISCARD_WHOLE_RESOURCE;
   } else {
      usage |= PIPE_TRANSFER_DISCARD_RANGE;
--- a/src/gallium/drivers/freedreno/Android.mk
+++ b/src/gallium/drivers/freedreno/Android.mk
@@ -1,44 +0,0 @@
-# Copyright (C) 2014 Emil Velikov <emil.l.velikov@gmail.com>
-#
-# Permission is hereby granted, free of charge, to any person obtaining a
-# copy of this software and associated documentation files (the "Software"),
-# to deal in the Software without restriction, including without limitation
-# the rights to use, copy, modify, merge, publish, distribute, sublicense,
-# and/or sell copies of the Software, and to permit persons to whom the
-# Software is furnished to do so, subject to the following conditions:
-#
-# The above copyright notice and this permission notice shall be included
-# in all copies or substantial portions of the Software.
-#
-# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
-# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
-# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
-# DEALINGS IN THE SOFTWARE.
-
-LOCAL_PATH := $(call my-dir)
-
-# get C_SOURCES
-include $(LOCAL_PATH)/Makefile.sources
-
-include $(CLEAR_VARS)
-
-LOCAL_SRC_FILES := \
-	$(C_SOURCES) \
-	$(a2xx_SOURCES) \
-	$(a3xx_SOURCES)
-
-LOCAL_CFLAGS := \
-	-Wno-packed-bitfield-compat
-
-LOCAL_C_INCLUDES := \
-	$(LOCAL_PATH)/ir3 \
-	$(TARGET_OUT_HEADERS)/libdrm \
-	$(TARGET_OUT_HEADERS)/freedreno
-
-LOCAL_MODULE := libmesa_pipe_freedreno
-
-include $(GALLIUM_COMMON_MK)
-include $(BUILD_STATIC_LIBRARY)
--- a/src/gallium/drivers/freedreno/Makefile.am
+++ b/src/gallium/drivers/freedreno/Makefile.am
@@ -5,6 +5,8 @@ include $(top_srcdir)/src/gallium/Automake.inc

 AM_CFLAGS = \
 	-Wno-packed-bitfield-compat \
+	-I$(top_srcdir)/src/gallium/drivers/freedreno/a3xx \
+	-I$(top_srcdir)/src/gallium/drivers/freedreno/a2xx \
 	$(GALLIUM_DRIVER_CFLAGS) \
 	$(FREEDRENO_CFLAGS)

--- a/src/gallium/drivers/freedreno/Makefile.sources
+++ b/src/gallium/drivers/freedreno/Makefile.sources
@@ -3,8 +3,6 @@ C_SOURCES := \
 	freedreno_lowering.c \
 	freedreno_program.c \
 	freedreno_query.c \
-	freedreno_query_hw.c \
-	freedreno_query_sw.c \
 	freedreno_fence.c \
 	freedreno_resource.c \
 	freedreno_surface.c \
@@ -40,7 +38,6 @@ a3xx_SOURCES := \
 	a3xx/fd3_emit.c \
 	a3xx/fd3_gmem.c \
 	a3xx/fd3_program.c \
-	a3xx/fd3_query.c \
 	a3xx/fd3_rasterizer.c \
 	a3xx/fd3_screen.c \
 	a3xx/fd3_texture.c \
--- a/src/gallium/drivers/freedreno/a2xx/a2xx.xml.h
+++ b/src/gallium/drivers/freedreno/a2xx/a2xx.xml.h
@@ -10,11 +10,11 @@ git clone https://github.com/freedreno/envytools.git
 The rules-ng-ng source files this header was generated from are:
 - /home/robclark/src/freedreno/envytools/rnndb/adreno.xml               (    364 bytes, from 2013-11-30 14:47:15)
 - /home/robclark/src/freedreno/envytools/rnndb/freedreno_copyright.xml  (   1453 bytes, from 2013-03-31 16:51:27)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a2xx.xml          (  32901 bytes, from 2014-06-02 15:21:30)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_common.xml (   9859 bytes, from 2014-06-02 15:21:30)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_pm4.xml    (  14477 bytes, from 2014-05-16 11:51:57)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a3xx.xml          (  58020 bytes, from 2014-06-13 17:29:47)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a4xx.xml          (  26602 bytes, from 2014-06-13 17:28:10)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a2xx.xml          (  32840 bytes, from 2014-01-05 14:44:21)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_common.xml (   9009 bytes, from 2014-01-11 16:56:35)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_pm4.xml    (  12362 bytes, from 2014-01-07 14:47:36)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a3xx.xml          (  56545 bytes, from 2014-02-26 16:32:11)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a4xx.xml          (   8344 bytes, from 2013-11-30 14:49:47)

 Copyright (C) 2013-2014 by the following authors:
 - Rob Clark <robdclark@gmail.com> (robclark)
@@ -203,15 +203,6 @@ enum a2xx_rb_copy_sample_select {
 	SAMPLE_0123 = 6,
 };

-enum a2xx_rb_blend_opcode {
-	BLEND_DST_PLUS_SRC = 0,
-	BLEND_SRC_MINUS_DST = 1,
-	BLEND_MIN_DST_SRC = 2,
-	BLEND_MAX_DST_SRC = 3,
-	BLEND_DST_MINUS_SRC = 4,
-	BLEND_DST_PLUS_SRC_BIAS = 5,
-};
-
 enum adreno_mmu_clnt_beh {
 	BEH_NEVR = 0,
 	BEH_TRAN_RNG = 1,
@@ -1005,7 +996,7 @@ static inline uint32_t A2XX_RB_BLEND_CONTROL_COLOR_SRCBLEND(enum adreno_rb_blend
 }
 #define A2XX_RB_BLEND_CONTROL_COLOR_COMB_FCN__MASK		0x000000e0
 #define A2XX_RB_BLEND_CONTROL_COLOR_COMB_FCN__SHIFT		5
-static inline uint32_t A2XX_RB_BLEND_CONTROL_COLOR_COMB_FCN(enum a2xx_rb_blend_opcode val)
+static inline uint32_t A2XX_RB_BLEND_CONTROL_COLOR_COMB_FCN(enum adreno_rb_blend_opcode val)
 {
 	return ((val) << A2XX_RB_BLEND_CONTROL_COLOR_COMB_FCN__SHIFT) & A2XX_RB_BLEND_CONTROL_COLOR_COMB_FCN__MASK;
 }
@@ -1023,7 +1014,7 @@ static inline uint32_t A2XX_RB_BLEND_CONTROL_ALPHA_SRCBLEND(enum adreno_rb_blend
 }
 #define A2XX_RB_BLEND_CONTROL_ALPHA_COMB_FCN__MASK		0x00e00000
 #define A2XX_RB_BLEND_CONTROL_ALPHA_COMB_FCN__SHIFT		21
-static inline uint32_t A2XX_RB_BLEND_CONTROL_ALPHA_COMB_FCN(enum a2xx_rb_blend_opcode val)
+static inline uint32_t A2XX_RB_BLEND_CONTROL_ALPHA_COMB_FCN(enum adreno_rb_blend_opcode val)
 {
 	return ((val) << A2XX_RB_BLEND_CONTROL_ALPHA_COMB_FCN__SHIFT) & A2XX_RB_BLEND_CONTROL_ALPHA_COMB_FCN__MASK;
 }
--- a/src/gallium/drivers/freedreno/a2xx/fd2_blend.c
+++ b/src/gallium/drivers/freedreno/a2xx/fd2_blend.c
@@ -34,27 +34,6 @@
 #include "fd2_context.h"
 #include "fd2_util.h"

-
-static enum a2xx_rb_blend_opcode
-blend_func(unsigned func)
-{
-	switch (func) {
-	case PIPE_BLEND_ADD:
-		return BLEND_DST_PLUS_SRC;
-	case PIPE_BLEND_MIN:
-		return BLEND_MIN_DST_SRC;
-	case PIPE_BLEND_MAX:
-		return BLEND_MAX_DST_SRC;
-	case PIPE_BLEND_SUBTRACT:
-		return BLEND_SRC_MINUS_DST;
-	case PIPE_BLEND_REVERSE_SUBTRACT:
-		return BLEND_DST_MINUS_SRC;
-	default:
-		DBG("invalid blend func: %x", func);
-		return 0;
-	}
-}
-
 void *
 fd2_blend_state_create(struct pipe_context *pctx,
 		const struct pipe_blend_state *cso)
@@ -82,10 +61,10 @@ fd2_blend_state_create(struct pipe_context *pctx,

 	so->rb_blendcontrol =
 		A2XX_RB_BLEND_CONTROL_COLOR_SRCBLEND(fd_blend_factor(rt->rgb_src_factor)) |
-		A2XX_RB_BLEND_CONTROL_COLOR_COMB_FCN(blend_func(rt->rgb_func)) |
+		A2XX_RB_BLEND_CONTROL_COLOR_COMB_FCN(fd_blend_func(rt->rgb_func)) |
 		A2XX_RB_BLEND_CONTROL_COLOR_DESTBLEND(fd_blend_factor(rt->rgb_dst_factor)) |
 		A2XX_RB_BLEND_CONTROL_ALPHA_SRCBLEND(fd_blend_factor(rt->alpha_src_factor)) |
-		A2XX_RB_BLEND_CONTROL_ALPHA_COMB_FCN(blend_func(rt->alpha_func)) |
+		A2XX_RB_BLEND_CONTROL_ALPHA_COMB_FCN(fd_blend_func(rt->alpha_func)) |
 		A2XX_RB_BLEND_CONTROL_ALPHA_DESTBLEND(fd_blend_factor(rt->alpha_dst_factor));

 	if (rt->colormask & PIPE_MASK_R)
--- a/src/gallium/drivers/freedreno/a2xx/fd2_emit.c
+++ b/src/gallium/drivers/freedreno/a2xx/fd2_emit.c
@@ -125,7 +125,7 @@ emit_texture(struct fd_ringbuffer *ring, struct fd_context *ctx,
 {
 	unsigned const_idx = fd2_get_const_idx(ctx, tex, samp_id);
 	static const struct fd2_sampler_stateobj dummy_sampler = {};
-	const struct fd2_sampler_stateobj *sampler;
+	struct fd2_sampler_stateobj *sampler;
 	struct fd2_pipe_sampler_view *view;

 	if (emitted & (1 << const_idx))
--- a/src/gallium/drivers/freedreno/a3xx/a3xx.xml.h
+++ b/src/gallium/drivers/freedreno/a3xx/a3xx.xml.h
@@ -10,11 +10,11 @@ git clone https://github.com/freedreno/envytools.git
 The rules-ng-ng source files this header was generated from are:
 - /home/robclark/src/freedreno/envytools/rnndb/adreno.xml               (    364 bytes, from 2013-11-30 14:47:15)
 - /home/robclark/src/freedreno/envytools/rnndb/freedreno_copyright.xml  (   1453 bytes, from 2013-03-31 16:51:27)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a2xx.xml          (  32901 bytes, from 2014-06-02 15:21:30)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_common.xml (   9859 bytes, from 2014-06-02 15:21:30)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_pm4.xml    (  14477 bytes, from 2014-05-16 11:51:57)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a3xx.xml          (  58020 bytes, from 2014-06-13 17:29:47)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a4xx.xml          (  26602 bytes, from 2014-06-13 17:28:10)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a2xx.xml          (  32840 bytes, from 2014-01-05 14:44:21)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_common.xml (   9009 bytes, from 2014-01-11 16:56:35)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_pm4.xml    (  12362 bytes, from 2014-01-07 14:47:36)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a3xx.xml          (  56545 bytes, from 2014-02-26 16:32:11)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a4xx.xml          (   8344 bytes, from 2013-11-30 14:49:47)

 Copyright (C) 2013-2014 by the following authors:
 - Rob Clark <robdclark@gmail.com> (robclark)
@@ -41,11 +41,31 @@ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 */


+enum a3xx_render_mode {
+	RB_RENDERING_PASS = 0,
+	RB_TILING_PASS = 1,
+	RB_RESOLVE_PASS = 2,
+};
+
 enum a3xx_tile_mode {
 	LINEAR = 0,
 	TILE_32X32 = 2,
 };

+enum a3xx_threadmode {
+	MULTI = 0,
+	SINGLE = 1,
+};
+
+enum a3xx_instrbuffermode {
+	BUFFER = 1,
+};
+
+enum a3xx_threadsize {
+	TWO_QUADS = 0,
+	FOUR_QUADS = 1,
+};
+
 enum a3xx_state_block_id {
 	HLSQ_BLOCK_ID_TP_TEX = 2,
 	HLSQ_BLOCK_ID_TP_MIPMAP = 3,
@@ -160,6 +180,12 @@ enum a3xx_color_swap {
 	XYZW = 3,
 };

+enum a3xx_msaa_samples {
+	MSAA_ONE = 0,
+	MSAA_TWO = 1,
+	MSAA_FOUR = 2,
+};
+
 enum a3xx_sp_perfcounter_select {
 	SP_FS_CFLOW_INSTRUCTIONS = 12,
 	SP_FS_FULL_ALU_INSTRUCTIONS = 14,
@@ -186,26 +212,21 @@ enum a3xx_rop_code {
 	ROP_SET = 15,
 };

-enum a3xx_rb_blend_opcode {
-	BLEND_DST_PLUS_SRC = 0,
-	BLEND_SRC_MINUS_DST = 1,
-	BLEND_DST_MINUS_SRC = 2,
-	BLEND_MIN_DST_SRC = 3,
-	BLEND_MAX_DST_SRC = 4,
+enum adreno_rb_copy_control_mode {
+	RB_COPY_RESOLVE = 1,
+	RB_COPY_DEPTH_STENCIL = 5,
 };

 enum a3xx_tex_filter {
 	A3XX_TEX_NEAREST = 0,
 	A3XX_TEX_LINEAR = 1,
-	A3XX_TEX_ANISO = 2,
 };

 enum a3xx_tex_clamp {
 	A3XX_TEX_REPEAT = 0,
 	A3XX_TEX_CLAMP_TO_EDGE = 1,
 	A3XX_TEX_MIRROR_REPEAT = 2,
-	A3XX_TEX_CLAMP_TO_BORDER = 3,
-	A3XX_TEX_MIRROR_CLAMP = 4,
+	A3XX_TEX_CLAMP_NONE = 3,
 };

 enum a3xx_tex_swiz {
@@ -316,7 +337,6 @@ enum a3xx_tex_type {
 #define REG_A3XX_RBBM_INT_0_STATUS				0x00000064

 #define REG_A3XX_RBBM_PERFCTR_CTL				0x00000080
-#define A3XX_RBBM_PERFCTR_CTL_ENABLE				0x00000001

 #define REG_A3XX_RBBM_PERFCTR_LOAD_CMD0				0x00000081

@@ -550,10 +570,6 @@ static inline uint32_t REG_A3XX_CP_PROTECT_REG(uint32_t i0) { return 0x00000460

 #define REG_A3XX_CP_AHB_FAULT					0x0000054d

-#define REG_A3XX_SP_GLOBAL_MEM_SIZE				0x00000e22
-
-#define REG_A3XX_SP_GLOBAL_MEM_ADDR				0x00000e23
-
 #define REG_A3XX_GRAS_CL_CLIP_CNTL				0x00002040
 #define A3XX_GRAS_CL_CLIP_CNTL_IJ_PERSP_CENTER			0x00001000
 #define A3XX_GRAS_CL_CLIP_CNTL_CLIP_DISABLE			0x00010000
@@ -628,26 +644,8 @@ static inline uint32_t A3XX_GRAS_CL_VPORT_ZSCALE(float val)
 }

 #define REG_A3XX_GRAS_SU_POINT_MINMAX				0x00002068
-#define A3XX_GRAS_SU_POINT_MINMAX_MIN__MASK			0x0000ffff
-#define A3XX_GRAS_SU_POINT_MINMAX_MIN__SHIFT			0
-static inline uint32_t A3XX_GRAS_SU_POINT_MINMAX_MIN(float val)
-{
-	return ((((uint32_t)(val * 8.0))) << A3XX_GRAS_SU_POINT_MINMAX_MIN__SHIFT) & A3XX_GRAS_SU_POINT_MINMAX_MIN__MASK;
-}
-#define A3XX_GRAS_SU_POINT_MINMAX_MAX__MASK			0xffff0000
-#define A3XX_GRAS_SU_POINT_MINMAX_MAX__SHIFT			16
-static inline uint32_t A3XX_GRAS_SU_POINT_MINMAX_MAX(float val)
-{
-	return ((((uint32_t)(val * 8.0))) << A3XX_GRAS_SU_POINT_MINMAX_MAX__SHIFT) & A3XX_GRAS_SU_POINT_MINMAX_MAX__MASK;
-}

 #define REG_A3XX_GRAS_SU_POINT_SIZE				0x00002069
-#define A3XX_GRAS_SU_POINT_SIZE__MASK				0xffffffff
-#define A3XX_GRAS_SU_POINT_SIZE__SHIFT				0
-static inline uint32_t A3XX_GRAS_SU_POINT_SIZE(float val)
-{
-	return ((((uint32_t)(val * 8.0))) << A3XX_GRAS_SU_POINT_SIZE__SHIFT) & A3XX_GRAS_SU_POINT_SIZE__MASK;
-}

 #define REG_A3XX_GRAS_SU_POLY_OFFSET_SCALE			0x0000206c
 #define A3XX_GRAS_SU_POLY_OFFSET_SCALE_VAL__MASK		0x00ffffff
@@ -887,7 +885,7 @@ static inline uint32_t A3XX_RB_MRT_BLEND_CONTROL_RGB_SRC_FACTOR(enum adreno_rb_b
 }
 #define A3XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE__MASK	0x000000e0
 #define A3XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE__SHIFT	5
-static inline uint32_t A3XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE(enum a3xx_rb_blend_opcode val)
+static inline uint32_t A3XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE(enum adreno_rb_blend_opcode val)
 {
 	return ((val) << A3XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE__SHIFT) & A3XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE__MASK;
 }
@@ -905,7 +903,7 @@ static inline uint32_t A3XX_RB_MRT_BLEND_CONTROL_ALPHA_SRC_FACTOR(enum adreno_rb
 }
 #define A3XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE__MASK	0x00e00000
 #define A3XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE__SHIFT	21
-static inline uint32_t A3XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE(enum a3xx_rb_blend_opcode val)
+static inline uint32_t A3XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE(enum adreno_rb_blend_opcode val)
 {
 	return ((val) << A3XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE__SHIFT) & A3XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE__MASK;
 }
@@ -988,19 +986,12 @@ static inline uint32_t A3XX_RB_COPY_CONTROL_MSAA_RESOLVE(enum a3xx_msaa_samples
 {
 	return ((val) << A3XX_RB_COPY_CONTROL_MSAA_RESOLVE__SHIFT) & A3XX_RB_COPY_CONTROL_MSAA_RESOLVE__MASK;
 }
-#define A3XX_RB_COPY_CONTROL_DEPTHCLEAR				0x00000008
 #define A3XX_RB_COPY_CONTROL_MODE__MASK				0x00000070
 #define A3XX_RB_COPY_CONTROL_MODE__SHIFT			4
 static inline uint32_t A3XX_RB_COPY_CONTROL_MODE(enum adreno_rb_copy_control_mode val)
 {
 	return ((val) << A3XX_RB_COPY_CONTROL_MODE__SHIFT) & A3XX_RB_COPY_CONTROL_MODE__MASK;
 }
-#define A3XX_RB_COPY_CONTROL_FASTCLEAR__MASK			0x00000f00
-#define A3XX_RB_COPY_CONTROL_FASTCLEAR__SHIFT			8
-static inline uint32_t A3XX_RB_COPY_CONTROL_FASTCLEAR(uint32_t val)
-{
-	return ((val) << A3XX_RB_COPY_CONTROL_FASTCLEAR__SHIFT) & A3XX_RB_COPY_CONTROL_FASTCLEAR__MASK;
-}
 #define A3XX_RB_COPY_CONTROL_GMEM_BASE__MASK			0xffffc000
 #define A3XX_RB_COPY_CONTROL_GMEM_BASE__SHIFT			14
 static inline uint32_t A3XX_RB_COPY_CONTROL_GMEM_BASE(uint32_t val)
@@ -1043,12 +1034,6 @@ static inline uint32_t A3XX_RB_COPY_DEST_INFO_SWAP(enum a3xx_color_swap val)
 {
 	return ((val) << A3XX_RB_COPY_DEST_INFO_SWAP__SHIFT) & A3XX_RB_COPY_DEST_INFO_SWAP__MASK;
 }
-#define A3XX_RB_COPY_DEST_INFO_DITHER_MODE__MASK		0x00000c00
-#define A3XX_RB_COPY_DEST_INFO_DITHER_MODE__SHIFT		10
-static inline uint32_t A3XX_RB_COPY_DEST_INFO_DITHER_MODE(enum adreno_rb_dither_mode val)
-{
-	return ((val) << A3XX_RB_COPY_DEST_INFO_DITHER_MODE__SHIFT) & A3XX_RB_COPY_DEST_INFO_DITHER_MODE__MASK;
-}
 #define A3XX_RB_COPY_DEST_INFO_COMPONENT_ENABLE__MASK		0x0003c000
 #define A3XX_RB_COPY_DEST_INFO_COMPONENT_ENABLE__SHIFT		14
 static inline uint32_t A3XX_RB_COPY_DEST_INFO_COMPONENT_ENABLE(uint32_t val)
@@ -1089,7 +1074,7 @@ static inline uint32_t A3XX_RB_DEPTH_INFO_DEPTH_FORMAT(enum adreno_rb_depth_form
 #define A3XX_RB_DEPTH_INFO_DEPTH_BASE__SHIFT			11
 static inline uint32_t A3XX_RB_DEPTH_INFO_DEPTH_BASE(uint32_t val)
 {
-	return ((val >> 12) << A3XX_RB_DEPTH_INFO_DEPTH_BASE__SHIFT) & A3XX_RB_DEPTH_INFO_DEPTH_BASE__MASK;
+	return ((val >> 10) << A3XX_RB_DEPTH_INFO_DEPTH_BASE__SHIFT) & A3XX_RB_DEPTH_INFO_DEPTH_BASE__MASK;
 }

 #define REG_A3XX_RB_DEPTH_PITCH					0x00002103
@@ -1217,8 +1202,6 @@ static inline uint32_t A3XX_RB_WINDOW_OFFSET_Y(uint32_t val)
 }

 #define REG_A3XX_RB_SAMPLE_COUNT_CONTROL			0x00002110
-#define A3XX_RB_SAMPLE_COUNT_CONTROL_RESET			0x00000001
-#define A3XX_RB_SAMPLE_COUNT_CONTROL_COPY			0x00000002

 #define REG_A3XX_RB_SAMPLE_COUNT_ADDR				0x00002111

@@ -1383,36 +1366,10 @@ static inline uint32_t A3XX_HLSQ_CONST_FSPRESV_RANGE_REG_ENDENTRY(uint32_t val)
 }

 #define REG_A3XX_HLSQ_CL_NDRANGE_0_REG				0x0000220a
-#define A3XX_HLSQ_CL_NDRANGE_0_REG_WORKDIM__MASK		0x00000003
-#define A3XX_HLSQ_CL_NDRANGE_0_REG_WORKDIM__SHIFT		0
-static inline uint32_t A3XX_HLSQ_CL_NDRANGE_0_REG_WORKDIM(uint32_t val)
-{
-	return ((val) << A3XX_HLSQ_CL_NDRANGE_0_REG_WORKDIM__SHIFT) & A3XX_HLSQ_CL_NDRANGE_0_REG_WORKDIM__MASK;
-}
-#define A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE0__MASK		0x00000ffc
-#define A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE0__SHIFT		2
-static inline uint32_t A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE0(uint32_t val)
-{
-	return ((val) << A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE0__SHIFT) & A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE0__MASK;
-}
-#define A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE1__MASK		0x003ff000
-#define A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE1__SHIFT		12
-static inline uint32_t A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE1(uint32_t val)
-{
-	return ((val) << A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE1__SHIFT) & A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE1__MASK;
-}
-#define A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE2__MASK		0xffc00000
-#define A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE2__SHIFT		22
-static inline uint32_t A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE2(uint32_t val)
-{
-	return ((val) << A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE2__SHIFT) & A3XX_HLSQ_CL_NDRANGE_0_REG_LOCALSIZE2__MASK;
-}

-static inline uint32_t REG_A3XX_HLSQ_CL_GLOBAL_WORK(uint32_t i0) { return 0x0000220b + 0x2*i0; }
+#define REG_A3XX_HLSQ_CL_NDRANGE_1_REG				0x0000220b

-static inline uint32_t REG_A3XX_HLSQ_CL_GLOBAL_WORK_SIZE(uint32_t i0) { return 0x0000220b + 0x2*i0; }
-
-static inline uint32_t REG_A3XX_HLSQ_CL_GLOBAL_WORK_OFFSET(uint32_t i0) { return 0x0000220c + 0x2*i0; }
+#define REG_A3XX_HLSQ_CL_NDRANGE_2_REG				0x0000220c

 #define REG_A3XX_HLSQ_CL_CONTROL_0_REG				0x00002211

@@ -1420,9 +1377,7 @@ static inline uint32_t REG_A3XX_HLSQ_CL_GLOBAL_WORK_OFFSET(uint32_t i0) { return

 #define REG_A3XX_HLSQ_CL_KERNEL_CONST_REG			0x00002214

-static inline uint32_t REG_A3XX_HLSQ_CL_KERNEL_GROUP(uint32_t i0) { return 0x00002215 + 0x1*i0; }
-
-static inline uint32_t REG_A3XX_HLSQ_CL_KERNEL_GROUP_RATIO(uint32_t i0) { return 0x00002215 + 0x1*i0; }
+#define REG_A3XX_HLSQ_CL_KERNEL_GROUP_X_REG			0x00002215

 #define REG_A3XX_HLSQ_CL_KERNEL_GROUP_Y_REG			0x00002216

@@ -1537,12 +1492,6 @@ static inline uint32_t A3XX_VFD_DECODE_INSTR_REGID(uint32_t val)
 {
 	return ((val) << A3XX_VFD_DECODE_INSTR_REGID__SHIFT) & A3XX_VFD_DECODE_INSTR_REGID__MASK;
 }
-#define A3XX_VFD_DECODE_INSTR_SWAP__MASK			0x00c00000
-#define A3XX_VFD_DECODE_INSTR_SWAP__SHIFT			22
-static inline uint32_t A3XX_VFD_DECODE_INSTR_SWAP(enum a3xx_color_swap val)
-{
-	return ((val) << A3XX_VFD_DECODE_INSTR_SWAP__SHIFT) & A3XX_VFD_DECODE_INSTR_SWAP__MASK;
-}
 #define A3XX_VFD_DECODE_INSTR_SHIFTCNT__MASK			0x1f000000
 #define A3XX_VFD_DECODE_INSTR_SHIFTCNT__SHIFT			24
 static inline uint32_t A3XX_VFD_DECODE_INSTR_SHIFTCNT(uint32_t val)
@@ -1675,7 +1624,6 @@ static inline uint32_t A3XX_SP_VS_CTRL_REG0_THREADSIZE(enum a3xx_threadsize val)
 }
 #define A3XX_SP_VS_CTRL_REG0_SUPERTHREADMODE			0x00200000
 #define A3XX_SP_VS_CTRL_REG0_PIXLODENABLE			0x00400000
-#define A3XX_SP_VS_CTRL_REG0_COMPUTEMODE			0x00800000
 #define A3XX_SP_VS_CTRL_REG0_LENGTH__MASK			0xff000000
 #define A3XX_SP_VS_CTRL_REG0_LENGTH__SHIFT			24
 static inline uint32_t A3XX_SP_VS_CTRL_REG0_LENGTH(uint32_t val)
@@ -1849,7 +1797,6 @@ static inline uint32_t A3XX_SP_FS_CTRL_REG0_THREADSIZE(enum a3xx_threadsize val)
 }
 #define A3XX_SP_FS_CTRL_REG0_SUPERTHREADMODE			0x00200000
 #define A3XX_SP_FS_CTRL_REG0_PIXLODENABLE			0x00400000
-#define A3XX_SP_FS_CTRL_REG0_COMPUTEMODE			0x00800000
 #define A3XX_SP_FS_CTRL_REG0_LENGTH__MASK			0xff000000
 #define A3XX_SP_FS_CTRL_REG0_LENGTH__SHIFT			24
 static inline uint32_t A3XX_SP_FS_CTRL_REG0_LENGTH(uint32_t val)
@@ -2029,42 +1976,6 @@ static inline uint32_t A3XX_TPL1_TP_FS_TEX_OFFSET_BASETABLEPTR(uint32_t val)

 #define REG_A3XX_VBIF_OUT_AXI_AOOO				0x0000305f

-#define REG_A3XX_VBIF_PERF_CNT_EN				0x00003070
-#define A3XX_VBIF_PERF_CNT_EN_CNT0				0x00000001
-#define A3XX_VBIF_PERF_CNT_EN_CNT1				0x00000002
-#define A3XX_VBIF_PERF_CNT_EN_PWRCNT0				0x00000004
-#define A3XX_VBIF_PERF_CNT_EN_PWRCNT1				0x00000008
-#define A3XX_VBIF_PERF_CNT_EN_PWRCNT2				0x00000010
-
-#define REG_A3XX_VBIF_PERF_CNT_CLR				0x00003071
-#define A3XX_VBIF_PERF_CNT_CLR_CNT0				0x00000001
-#define A3XX_VBIF_PERF_CNT_CLR_CNT1				0x00000002
-#define A3XX_VBIF_PERF_CNT_CLR_PWRCNT0				0x00000004
-#define A3XX_VBIF_PERF_CNT_CLR_PWRCNT1				0x00000008
-#define A3XX_VBIF_PERF_CNT_CLR_PWRCNT2				0x00000010
-
-#define REG_A3XX_VBIF_PERF_CNT_SEL				0x00003072
-
-#define REG_A3XX_VBIF_PERF_CNT0_LO				0x00003073
-
-#define REG_A3XX_VBIF_PERF_CNT0_HI				0x00003074
-
-#define REG_A3XX_VBIF_PERF_CNT1_LO				0x00003075
-
-#define REG_A3XX_VBIF_PERF_CNT1_HI				0x00003076
-
-#define REG_A3XX_VBIF_PERF_PWR_CNT0_LO				0x00003077
-
-#define REG_A3XX_VBIF_PERF_PWR_CNT0_HI				0x00003078
-
-#define REG_A3XX_VBIF_PERF_PWR_CNT1_LO				0x00003079
-
-#define REG_A3XX_VBIF_PERF_PWR_CNT1_HI				0x0000307a
-
-#define REG_A3XX_VBIF_PERF_PWR_CNT2_LO				0x0000307b
-
-#define REG_A3XX_VBIF_PERF_PWR_CNT2_HI				0x0000307c
-
 #define REG_A3XX_VSC_BIN_SIZE					0x00000c01
 #define A3XX_VSC_BIN_SIZE_WIDTH__MASK				0x0000001f
 #define A3XX_VSC_BIN_SIZE_WIDTH__SHIFT				0
@@ -2338,12 +2249,6 @@ static inline uint32_t A3XX_TEX_SAMP_0_WRAP_R(enum a3xx_tex_clamp val)
 {
 	return ((val) << A3XX_TEX_SAMP_0_WRAP_R__SHIFT) & A3XX_TEX_SAMP_0_WRAP_R__MASK;
 }
-#define A3XX_TEX_SAMP_0_COMPARE_FUNC__MASK			0x00700000
-#define A3XX_TEX_SAMP_0_COMPARE_FUNC__SHIFT			20
-static inline uint32_t A3XX_TEX_SAMP_0_COMPARE_FUNC(enum adreno_compare_func val)
-{
-	return ((val) << A3XX_TEX_SAMP_0_COMPARE_FUNC__SHIFT) & A3XX_TEX_SAMP_0_COMPARE_FUNC__MASK;
-}
 #define A3XX_TEX_SAMP_0_UNNORM_COORDS				0x80000000

 #define REG_A3XX_TEX_SAMP_1					0x00000001
@@ -2362,7 +2267,6 @@ static inline uint32_t A3XX_TEX_SAMP_1_MIN_LOD(float val)

 #define REG_A3XX_TEX_CONST_0					0x00000000
 #define A3XX_TEX_CONST_0_TILED					0x00000001
-#define A3XX_TEX_CONST_0_SRGB					0x00000004
 #define A3XX_TEX_CONST_0_SWIZ_X__MASK				0x00000070
 #define A3XX_TEX_CONST_0_SWIZ_X__SHIFT				4
 static inline uint32_t A3XX_TEX_CONST_0_SWIZ_X(enum a3xx_tex_swiz val)
@@ -2399,7 +2303,6 @@ static inline uint32_t A3XX_TEX_CONST_0_FMT(enum a3xx_tex_fmt val)
 {
 	return ((val) << A3XX_TEX_CONST_0_FMT__SHIFT) & A3XX_TEX_CONST_0_FMT__MASK;
 }
-#define A3XX_TEX_CONST_0_NOCONVERT				0x20000000
 #define A3XX_TEX_CONST_0_TYPE__MASK				0xc0000000
 #define A3XX_TEX_CONST_0_TYPE__SHIFT				30
 static inline uint32_t A3XX_TEX_CONST_0_TYPE(enum a3xx_tex_type val)
--- a/src/gallium/drivers/freedreno/a3xx/fd3_blend.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_blend.c
@@ -34,27 +34,6 @@
 #include "fd3_context.h"
 #include "fd3_util.h"

-
-static enum a3xx_rb_blend_opcode
-blend_func(unsigned func)
-{
-	switch (func) {
-	case PIPE_BLEND_ADD:
-		return BLEND_DST_PLUS_SRC;
-	case PIPE_BLEND_MIN:
-		return BLEND_MIN_DST_SRC;
-	case PIPE_BLEND_MAX:
-		return BLEND_MAX_DST_SRC;
-	case PIPE_BLEND_SUBTRACT:
-		return BLEND_SRC_MINUS_DST;
-	case PIPE_BLEND_REVERSE_SUBTRACT:
-		return BLEND_DST_MINUS_SRC;
-	default:
-		DBG("invalid blend func: %x", func);
-		return 0;
-	}
-}
-
 void *
 fd3_blend_state_create(struct pipe_context *pctx,
 		const struct pipe_blend_state *cso)
@@ -101,10 +80,10 @@ fd3_blend_state_create(struct pipe_context *pctx,

 		so->rb_mrt[i].blend_control =
 				A3XX_RB_MRT_BLEND_CONTROL_RGB_SRC_FACTOR(fd_blend_factor(rt->rgb_src_factor)) |
-				A3XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE(blend_func(rt->rgb_func)) |
+				A3XX_RB_MRT_BLEND_CONTROL_RGB_BLEND_OPCODE(fd_blend_func(rt->rgb_func)) |
 				A3XX_RB_MRT_BLEND_CONTROL_RGB_DEST_FACTOR(fd_blend_factor(rt->rgb_dst_factor)) |
 				A3XX_RB_MRT_BLEND_CONTROL_ALPHA_SRC_FACTOR(fd_blend_factor(rt->alpha_src_factor)) |
-				A3XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE(blend_func(rt->alpha_func)) |
+				A3XX_RB_MRT_BLEND_CONTROL_ALPHA_BLEND_OPCODE(fd_blend_func(rt->alpha_func)) |
 				A3XX_RB_MRT_BLEND_CONTROL_ALPHA_DEST_FACTOR(fd_blend_factor(rt->alpha_dst_factor)) |
 				A3XX_RB_MRT_BLEND_CONTROL_CLAMP_ENABLE;

--- a/src/gallium/drivers/freedreno/a3xx/fd3_compiler.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_compiler.c
@@ -1074,154 +1074,77 @@ trans_arl(const struct instr_translater *t,
 	add_src_reg(ctx, instr, tmp_src, chan)->flags |= IR3_REG_HALF;
 }

-/*
- * texture fetch/sample instructions:
- */
-
-struct tex_info {
-	int8_t order[4];
-	unsigned src_wrmask, flags;
-};
-
-static const struct tex_info *
-get_tex_info(struct fd3_compile_context *ctx,
+/* texture fetch/sample instructions: */
+static void
+trans_samp(const struct instr_translater *t,
+		struct fd3_compile_context *ctx,
 		struct tgsi_full_instruction *inst)
 {
-	static const struct tex_info tex1d = {
-		.order = { 0, -1, -1, -1 },  /* coord.x */
-		.src_wrmask = TGSI_WRITEMASK_XY,
-		.flags = 0,
-	};
-	static const struct tex_info tex1ds = {
-		.order = { 0, -1,  2, -1 },  /* coord.xz */
-		.src_wrmask = TGSI_WRITEMASK_XYZ,
-		.flags = IR3_INSTR_S,
-	};
-	static const struct tex_info tex2d = {
-		.order = { 0,  1, -1, -1 },  /* coord.xy */
-		.src_wrmask = TGSI_WRITEMASK_XY,
-		.flags = 0,
-	};
-	static const struct tex_info tex2ds = {
-		.order = { 0,  1,  2, -1 },  /* coord.xyz */
-		.src_wrmask = TGSI_WRITEMASK_XYZ,
-		.flags = IR3_INSTR_S,
-	};
-	static const struct tex_info tex3d = {
-		.order = { 0,  1,  2, -1 },  /* coord.xyz */
-		.src_wrmask = TGSI_WRITEMASK_XYZ,
-		.flags = IR3_INSTR_3D,
-	};
-	static const struct tex_info tex3ds = {
-		.order = { 0,  1,  2,  3 },  /* coord.xyzw */
-		.src_wrmask = TGSI_WRITEMASK_XYZW,
-		.flags = IR3_INSTR_S | IR3_INSTR_3D,
-	};
-	static const struct tex_info txp1d = {
-		.order = { 0, -1,  3, -1 },  /* coord.xw */
-		.src_wrmask = TGSI_WRITEMASK_XYZ,
-		.flags = IR3_INSTR_P,
-	};
-	static const struct tex_info txp1ds = {
-		.order = { 0, -1,  2,  3 },  /* coord.xzw */
-		.src_wrmask = TGSI_WRITEMASK_XYZW,
-		.flags = IR3_INSTR_P | IR3_INSTR_S,
-	};
-	static const struct tex_info txp2d = {
-		.order = { 0,  1,  3, -1 },  /* coord.xyw */
-		.src_wrmask = TGSI_WRITEMASK_XYZ,
-		.flags = IR3_INSTR_P,
-	};
-	static const struct tex_info txp2ds = {
-		.order = { 0,  1,  2,  3 },  /* coord.xyzw */
-		.src_wrmask = TGSI_WRITEMASK_XYZW,
-		.flags = IR3_INSTR_P | IR3_INSTR_S,
-	};
-	static const struct tex_info txp3d = {
-		.order = { 0,  1,  2,  3 },  /* coord.xyzw */
-		.src_wrmask = TGSI_WRITEMASK_XYZW,
-		.flags = IR3_INSTR_P | IR3_INSTR_3D,
-	};
-
+	struct ir3_instruction *instr;
+	struct tgsi_src_register *coord = &inst->Src[0].Register;
+	struct tgsi_src_register *samp  = &inst->Src[1].Register;
 	unsigned tex = inst->Texture.Texture;
+	int8_t *order;
+	unsigned i, flags = 0, src_wrmask;
+	bool needs_mov = false;

-	switch (inst->Instruction.Opcode) {
+	switch (t->arg) {
 	case TGSI_OPCODE_TEX:
 		switch (tex) {
-		case TGSI_TEXTURE_1D:
-			return &tex1d;
-		case TGSI_TEXTURE_SHADOW1D:
-			return &tex1ds;
 		case TGSI_TEXTURE_2D:
 		case TGSI_TEXTURE_RECT:
-			return &tex2d;
-		case TGSI_TEXTURE_SHADOW2D:
-		case TGSI_TEXTURE_SHADOWRECT:
-			return &tex2ds;
+			order = (int8_t[4]){ 0,  1, -1, -1 };
+			src_wrmask = TGSI_WRITEMASK_XY;
+			break;
 		case TGSI_TEXTURE_3D:
 		case TGSI_TEXTURE_CUBE:
-			return &tex3d;
-		case TGSI_TEXTURE_SHADOWCUBE:
-			return &tex3ds;
-		default:
-			compile_error(ctx, "unknown texture type: %s\n",
-					tgsi_texture_names[tex]);
-			return NULL;
-		}
-		break;
-	case TGSI_OPCODE_TXP:
-		switch (tex) {
-		case TGSI_TEXTURE_1D:
-			return &txp1d;
-		case TGSI_TEXTURE_SHADOW1D:
-			return &txp1ds;
-		case TGSI_TEXTURE_2D:
-		case TGSI_TEXTURE_RECT:
-			return &txp2d;
-		case TGSI_TEXTURE_SHADOW2D:
-		case TGSI_TEXTURE_SHADOWRECT:
-			return &txp2ds;
-		case TGSI_TEXTURE_3D:
-		case TGSI_TEXTURE_CUBE:
-			return &txp3d;
+			order = (int8_t[4]){ 0,  1,  2, -1 };
+			src_wrmask = TGSI_WRITEMASK_XYZ;
+			flags |= IR3_INSTR_3D;
+			break;
 		default:
 			compile_error(ctx, "unknown texture type: %s\n",
 					tgsi_texture_names[tex]);
 			break;
 		}
 		break;
+	case TGSI_OPCODE_TXP:
+		switch (tex) {
+		case TGSI_TEXTURE_2D:
+		case TGSI_TEXTURE_RECT:
+			order = (int8_t[4]){ 0,  1,  3, -1 };
+			src_wrmask = TGSI_WRITEMASK_XYZ;
+			break;
+		case TGSI_TEXTURE_3D:
+		case TGSI_TEXTURE_CUBE:
+			order = (int8_t[4]){ 0,  1,  2,  3 };
+			src_wrmask = TGSI_WRITEMASK_XYZW;
+			flags |= IR3_INSTR_3D;
+			break;
+		default:
+			compile_error(ctx, "unknown texture type: %s\n",
+					tgsi_texture_names[tex]);
+			break;
+		}
+		flags |= IR3_INSTR_P;
+		break;
+	default:
+		compile_assert(ctx, 0);
+		break;
 	}
-	compile_assert(ctx, 0);
-	return NULL;
-}
-
-static struct tgsi_src_register *
-get_tex_coord(struct fd3_compile_context *ctx,
-		struct tgsi_full_instruction *inst,
-		const struct tex_info *tinf)
-{
-	struct tgsi_src_register *coord = &inst->Src[0].Register;
-	struct ir3_instruction *instr;
-	unsigned tex = inst->Texture.Texture;
-	bool needs_mov = false;
-	unsigned i;

 	/* cat5 instruction cannot seem to handle const or relative: */
 	if (is_rel_or_const(coord))
 		needs_mov = true;

-	/* 1D textures we fix up w/ 0.0 as 2nd coord: */
-	if ((tex == TGSI_TEXTURE_1D) || (tex == TGSI_TEXTURE_SHADOW1D))
-		needs_mov = true;
-
 	/* The texture sample instructions need to coord in successive
 	 * registers/components (ie. src.xy but not src.yx).  And TXP
 	 * needs the .w component in .z for 2D..  so in some cases we
 	 * might need to emit some mov instructions to shuffle things
 	 * around:
 	 */
-	for (i = 1; (i < 4) && (tinf->order[i] >= 0) && !needs_mov; i++)
-		if (src_swiz(coord, i) != (src_swiz(coord, 0) + tinf->order[i]))
+	for (i = 1; (i < 4) && (order[i] >= 0) && !needs_mov; i++)
+		if (src_swiz(coord, i) != (src_swiz(coord, 0) + order[i]))
 			needs_mov = true;

 	if (needs_mov) {
@@ -1234,55 +1157,28 @@ get_tex_coord(struct fd3_compile_context *ctx,
 		/* need to move things around: */
 		tmp_src = get_internal_temp(ctx, &tmp_dst);

-		for (j = 0; j < 4; j++) {
-			if (tinf->order[j] < 0)
-				continue;
-			instr = instr_create(ctx, 1, 0);  /* mov */
+		for (j = 0; (j < 4) && (order[j] >= 0); j++) {
+			instr = instr_create(ctx, 1, 0);
 			instr->cat1.src_type = type_mov;
 			instr->cat1.dst_type = type_mov;
 			add_dst_reg(ctx, instr, &tmp_dst, j);
 			add_src_reg(ctx, instr, coord,
-					src_swiz(coord, tinf->order[j]));
-		}
-
-		/* fix up .y coord: */
-		if ((tex == TGSI_TEXTURE_1D) ||
-				(tex == TGSI_TEXTURE_SHADOW1D)) {
-			instr = instr_create(ctx, 1, 0);  /* mov */
-			instr->cat1.src_type = type_mov;
-			instr->cat1.dst_type = type_mov;
-			add_dst_reg(ctx, instr, &tmp_dst, 1);  /* .y */
-			ir3_reg_create(instr, 0, IR3_REG_IMMED)->fim_val = 0.5;
+					src_swiz(coord, order[j]));
 		}

 		coord = tmp_src;
 	}

-	return coord;
-}
-
-static void
-trans_samp(const struct instr_translater *t,
-		struct fd3_compile_context *ctx,
-		struct tgsi_full_instruction *inst)
-{
-	struct ir3_instruction *instr;
-	struct tgsi_dst_register *dst = &inst->Dst[0].Register;
-	struct tgsi_src_register *coord;
-	struct tgsi_src_register *samp  = &inst->Src[1].Register;
-	const struct tex_info *tinf;
-
-	tinf = get_tex_info(ctx, inst);
-	coord = get_tex_coord(ctx, inst, tinf);
-
 	instr = instr_create(ctx, 5, t->opc);
 	instr->cat5.type = get_ftype(ctx);
 	instr->cat5.samp = samp->Index;
 	instr->cat5.tex  = samp->Index;
-	instr->flags |= tinf->flags;
+	instr->flags |= flags;

-	add_dst_reg_wrmask(ctx, instr, dst, 0, dst->WriteMask);
-	add_src_reg_wrmask(ctx, instr, coord, coord->SwizzleX, tinf->src_wrmask);
+	add_dst_reg_wrmask(ctx, instr, &inst->Dst[0].Register, 0,
+			inst->Dst[0].Register.WriteMask);
+
+	add_src_reg_wrmask(ctx, instr, coord, coord->SwizzleX, src_wrmask);
 }

 /*
@@ -1335,19 +1231,15 @@ trans_cmp(const struct instr_translater *t,

 	switch (t->tgsi_opc) {
 	case TGSI_OPCODE_SEQ:
-	case TGSI_OPCODE_FSEQ:
 		condition = IR3_COND_EQ;
 		break;
 	case TGSI_OPCODE_SNE:
-	case TGSI_OPCODE_FSNE:
 		condition = IR3_COND_NE;
 		break;
 	case TGSI_OPCODE_SGE:
-	case TGSI_OPCODE_FSGE:
 		condition = IR3_COND_GE;
 		break;
 	case TGSI_OPCODE_SLT:
-	case TGSI_OPCODE_FSLT:
 		condition = IR3_COND_LT;
 		break;
 	case TGSI_OPCODE_SLE:
@@ -1377,15 +1269,11 @@ trans_cmp(const struct instr_translater *t,

 	switch (t->tgsi_opc) {
 	case TGSI_OPCODE_SEQ:
-	case TGSI_OPCODE_FSEQ:
 	case TGSI_OPCODE_SGE:
-	case TGSI_OPCODE_FSGE:
 	case TGSI_OPCODE_SLE:
 	case TGSI_OPCODE_SNE:
-	case TGSI_OPCODE_FSNE:
 	case TGSI_OPCODE_SGT:
 	case TGSI_OPCODE_SLT:
-	case TGSI_OPCODE_FSLT:
 		/* cov.u16f16 dst, tmp0 */
 		instr = instr_create(ctx, 1, 0);
 		instr->cat1.src_type = get_utype(ctx);
@@ -1405,96 +1293,6 @@ trans_cmp(const struct instr_translater *t,
 	put_dst(ctx, inst, dst);
 }

-/*
- * USNE(a,b) = (a != b) ? 1 : 0
- *   cmps.u32.ne dst, a, b
- *
- * USEQ(a,b) = (a == b) ? 1 : 0
- *   cmps.u32.eq dst, a, b
- *
- * ISGE(a,b) = (a > b) ? 1 : 0
- *   cmps.s32.ge dst, a, b
- *
- * USGE(a,b) = (a > b) ? 1 : 0
- *   cmps.u32.ge dst, a, b
- *
- * ISLT(a,b) = (a < b) ? 1 : 0
- *   cmps.s32.lt dst, a, b
- *
- * USLT(a,b) = (a < b) ? 1 : 0
- *   cmps.u32.lt dst, a, b
- *
- * UCMP(a,b,c) = (a < 0) ? b : c
- *   cmps.u32.lt tmp0, a, {0}
- *   sel.b16 dst, b, tmp0, c
- */
-static void
-trans_icmp(const struct instr_translater *t,
-		struct fd3_compile_context *ctx,
-		struct tgsi_full_instruction *inst)
-{
-	struct ir3_instruction *instr;
-	struct tgsi_dst_register *dst = get_dst(ctx, inst);
-	struct tgsi_src_register constval0;
-	struct tgsi_src_register *a0, *a1, *a2;
-	unsigned condition;
-
-	a0 = &inst->Src[0].Register;  /* a */
-	a1 = &inst->Src[1].Register;  /* b */
-
-	switch (t->tgsi_opc) {
-	case TGSI_OPCODE_USNE:
-		condition = IR3_COND_NE;
-		break;
-	case TGSI_OPCODE_USEQ:
-		condition = IR3_COND_EQ;
-		break;
-	case TGSI_OPCODE_ISGE:
-	case TGSI_OPCODE_USGE:
-		condition = IR3_COND_GE;
-		break;
-	case TGSI_OPCODE_ISLT:
-	case TGSI_OPCODE_USLT:
-		condition = IR3_COND_LT;
-		break;
-	case TGSI_OPCODE_UCMP:
-		get_immediate(ctx, &constval0, 0);
-		a0 = &inst->Src[0].Register;  /* a */
-		a1 = &constval0;              /* {0} */
-		condition = IR3_COND_LT;
-		break;
-
-	default:
-		compile_assert(ctx, 0);
-		return;
-	}
-
-	if (is_const(a0) && is_const(a1))
-		a0 = get_unconst(ctx, a0);
-
-	if (t->tgsi_opc == TGSI_OPCODE_UCMP) {
-		struct tgsi_dst_register tmp_dst;
-		struct tgsi_src_register *tmp_src;
-		tmp_src = get_internal_temp(ctx, &tmp_dst);
-		/* cmps.u32.lt tmp, a0, a1 */
-		instr = instr_create(ctx, 2, t->opc);
-		instr->cat2.condition = condition;
-		vectorize(ctx, instr, &tmp_dst, 2, a0, 0, a1, 0);
-
-		a1 = &inst->Src[1].Register;
-		a2 = &inst->Src[2].Register;
-		/* sel.{b32,b16} dst, src2, tmp, src1 */
-		instr = instr_create(ctx, 3, OPC_SEL_B32);
-		vectorize(ctx, instr, dst, 3, a1, 0, tmp_src, 0, a2, 0);
-	} else {
-		/* cmps.{u32,s32}.<cond> dst, a0, a1 */
-		instr = instr_create(ctx, 2, t->opc);
-		instr->cat2.condition = condition;
-		vectorize(ctx, instr, dst, 2, a0, 0, a1, 0);
-	}
-	put_dst(ctx, inst, dst);
-}
-
 /*
 * Conditional / Flow control
 */
@@ -1735,7 +1533,7 @@ trans_endif(const struct instr_translater *t,
 }

 /*
- * Kill
+ * Kill / Kill-if
 */

 static void
@@ -1781,76 +1579,6 @@ trans_kill(const struct instr_translater *t,
 	ctx->kill[ctx->kill_count++] = instr;
 }

-/*
- * Kill-If
- */
-
-static void
-trans_killif(const struct instr_translater *t,
-		struct fd3_compile_context *ctx,
-		struct tgsi_full_instruction *inst)
-{
-	struct tgsi_src_register *src = &inst->Src[0].Register;
-	struct ir3_instruction *instr, *immed, *cond = NULL;
-	bool inv = false;
-
-	immed = create_immed(ctx, 0.0);
-
-	/* cmps.f.ne p0.x, cond, {0.0} */
-	instr = instr_create(ctx, 2, OPC_CMPS_F);
-	instr->cat2.condition = IR3_COND_NE;
-	ir3_reg_create(instr, regid(REG_P0, 0), 0);
-	ir3_reg_create(instr, 0, IR3_REG_SSA)->instr = immed;
-	add_src_reg(ctx, instr, src, src->SwizzleX);
-
-	cond = instr;
-
-	/* kill p0.x */
-	instr = instr_create(ctx, 0, OPC_KILL);
-	instr->cat0.inv = inv;
-	ir3_reg_create(instr, 0, 0);  /* dummy dst */
-	ir3_reg_create(instr, 0, IR3_REG_SSA)->instr = cond;
-
-	ctx->kill[ctx->kill_count++] = instr;
-
-}
-/*
- * I2F / U2F / F2I / F2U
- */
-
-static void
-trans_cov(const struct instr_translater *t,
-		struct fd3_compile_context *ctx,
-		struct tgsi_full_instruction *inst)
-{
-	struct ir3_instruction *instr;
-	struct tgsi_dst_register *dst = get_dst(ctx, inst);
-	struct tgsi_src_register *src = &inst->Src[0].Register;
-
-	// cov.f32s32 dst, tmp0 /
-	instr = instr_create(ctx, 1, 0);
-	switch (t->tgsi_opc) {
-	case TGSI_OPCODE_U2F:
-		instr->cat1.src_type = TYPE_U32;
-		instr->cat1.dst_type = TYPE_F32;
-		break;
-	case TGSI_OPCODE_I2F:
-		instr->cat1.src_type = TYPE_S32;
-		instr->cat1.dst_type = TYPE_F32;
-		break;
-	case TGSI_OPCODE_F2U:
-		instr->cat1.src_type = TYPE_F32;
-		instr->cat1.dst_type = TYPE_U32;
-		break;
-	case TGSI_OPCODE_F2I:
-		instr->cat1.src_type = TYPE_F32;
-		instr->cat1.dst_type = TYPE_S32;
-		break;
-
-	}
-	vectorize(ctx, instr, dst, 1, src, 0);
-}
-
 /*
 * Handlers for TGSI instructions which do have 1:1 mapping to native
 * instructions:
@@ -1888,11 +1616,9 @@ instr_cat2(const struct instr_translater *t,

 	switch (t->tgsi_opc) {
 	case TGSI_OPCODE_ABS:
-	case TGSI_OPCODE_IABS:
 		src0_flags = IR3_REG_ABS;
 		break;
 	case TGSI_OPCODE_SUB:
-	case TGSI_OPCODE_INEG:
 		src1_flags = IR3_REG_NEGATE;
 		break;
 	}
@@ -1998,22 +1724,6 @@ static const struct instr_translater translaters[TGSI_OPCODE_LAST] = {
 	INSTR(SUB,          instr_cat2, .opc = OPC_ADD_F),
 	INSTR(MIN,          instr_cat2, .opc = OPC_MIN_F),
 	INSTR(MAX,          instr_cat2, .opc = OPC_MAX_F),
-	INSTR(UADD,         instr_cat2, .opc = OPC_ADD_U),
-	INSTR(IMIN,         instr_cat2, .opc = OPC_MIN_S),
-	INSTR(UMIN,         instr_cat2, .opc = OPC_MIN_U),
-	INSTR(IMAX,         instr_cat2, .opc = OPC_MAX_S),
-	INSTR(UMAX,         instr_cat2, .opc = OPC_MAX_U),
-	INSTR(AND,          instr_cat2, .opc = OPC_AND_B),
-	INSTR(OR,           instr_cat2, .opc = OPC_OR_B),
-	INSTR(NOT,          instr_cat2, .opc = OPC_NOT_B),
-	INSTR(XOR,          instr_cat2, .opc = OPC_XOR_B),
-	INSTR(UMUL,         instr_cat2, .opc = OPC_MUL_U),
-	INSTR(SHL,          instr_cat2, .opc = OPC_SHL_B),
-	INSTR(USHR,         instr_cat2, .opc = OPC_SHR_B),
-	INSTR(ISHR,         instr_cat2, .opc = OPC_ASHR_B),
-	INSTR(IABS,         instr_cat2, .opc = OPC_ABSNEG_S),
-	INSTR(INEG,         instr_cat2, .opc = OPC_ABSNEG_S),
-	INSTR(AND,          instr_cat2, .opc = OPC_AND_B),
 	INSTR(MAD,          instr_cat3, .opc = OPC_MAD_F32, .hopc = OPC_MAD_F16),
 	INSTR(TRUNC,        instr_cat2, .opc = OPC_TRUNC_F),
 	INSTR(CLAMP,        trans_clamp),
@@ -2031,33 +1741,16 @@ static const struct instr_translater translaters[TGSI_OPCODE_LAST] = {
 	INSTR(TXP,          trans_samp, .opc = OPC_SAM, .arg = TGSI_OPCODE_TXP),
 	INSTR(SGT,          trans_cmp),
 	INSTR(SLT,          trans_cmp),
-	INSTR(FSLT,         trans_cmp),
 	INSTR(SGE,          trans_cmp),
-	INSTR(FSGE,         trans_cmp),
 	INSTR(SLE,          trans_cmp),
 	INSTR(SNE,          trans_cmp),
-	INSTR(FSNE,         trans_cmp),
 	INSTR(SEQ,          trans_cmp),
-	INSTR(FSEQ,         trans_cmp),
 	INSTR(CMP,          trans_cmp),
-	INSTR(USNE,         trans_icmp, .opc = OPC_CMPS_U),
-	INSTR(USEQ,         trans_icmp, .opc = OPC_CMPS_U),
-	INSTR(ISGE,         trans_icmp, .opc = OPC_CMPS_S),
-	INSTR(USGE,         trans_icmp, .opc = OPC_CMPS_U),
-	INSTR(ISLT,         trans_icmp, .opc = OPC_CMPS_S),
-	INSTR(USLT,         trans_icmp, .opc = OPC_CMPS_U),
-	INSTR(UCMP,         trans_icmp, .opc = OPC_CMPS_U),
 	INSTR(IF,           trans_if),
-	INSTR(UIF,          trans_if),
 	INSTR(ELSE,         trans_else),
 	INSTR(ENDIF,        trans_endif),
 	INSTR(END,          instr_cat0, .opc = OPC_END),
 	INSTR(KILL,         trans_kill, .opc = OPC_KILL),
-	INSTR(KILL_IF,      trans_killif, .opc = OPC_KILL),
-	INSTR(I2F,          trans_cov),
-	INSTR(U2F,          trans_cov),
-	INSTR(F2I,          trans_cov),
-	INSTR(F2U,          trans_cov),
 };

 static fd3_semantic
@@ -2242,8 +1935,6 @@ decl_in(struct fd3_compile_context *ctx, struct tgsi_full_declaration *decl)

 		DBG("decl in -> r%d", i);

-		compile_assert(ctx, n < ARRAY_SIZE(so->inputs));
-
 		so->inputs[n].semantic = decl_semantic(&decl->Semantic);
 		so->inputs[n].compmask = (1 << ncomp) - 1;
 		so->inputs[n].regid = r;
@@ -2333,8 +2024,6 @@ decl_out(struct fd3_compile_context *ctx, struct tgsi_full_declaration *decl)

 		ncomp = 4;

-		compile_assert(ctx, n < ARRAY_SIZE(so->outputs));
-
 		so->outputs[n].semantic = decl_semantic(&decl->Semantic);
 		so->outputs[n].regid = regid(i, comp);

@@ -2458,7 +2147,6 @@ compile_instructions(struct fd3_compile_context *ctx)
 			struct tgsi_full_immediate *imm =
 					&ctx->parser.FullToken.FullImmediate;
 			unsigned n = ctx->so->immediates_count++;
-			compile_assert(ctx, n < ARRAY_SIZE(ctx->so->immediates));
 			memcpy(ctx->so->immediates[n].val, imm->u, 16);
 			break;
 		}
--- a/src/gallium/drivers/freedreno/a3xx/fd3_compiler_old.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_compiler_old.c
@@ -1324,8 +1324,6 @@ decl_in(struct fd3_compile_context *ctx, struct tgsi_full_declaration *decl)

 		DBG("decl in -> r%d", i + base);   // XXX

-		compile_assert(ctx, n < ARRAY_SIZE(so->inputs));
-
 		so->inputs[n].semantic = decl_semantic(&decl->Semantic);
 		so->inputs[n].compmask = (1 << ncomp) - 1;
 		so->inputs[n].ncomp = ncomp;
@@ -1412,7 +1410,6 @@ decl_out(struct fd3_compile_context *ctx, struct tgsi_full_declaration *decl)

 	for (i = decl->Range.First; i <= decl->Range.Last; i++) {
 		unsigned n = so->outputs_count++;
-		compile_assert(ctx, n < ARRAY_SIZE(so->outputs));
 		so->outputs[n].semantic = decl_semantic(&decl->Semantic);
 		so->outputs[n].regid = regid(i + base, comp);
 	}
--- a/src/gallium/drivers/freedreno/a3xx/fd3_context.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_context.c
@@ -33,7 +33,6 @@
 #include "fd3_emit.h"
 #include "fd3_gmem.h"
 #include "fd3_program.h"
-#include "fd3_query.h"
 #include "fd3_rasterizer.h"
 #include "fd3_texture.h"
 #include "fd3_zsa.h"
@@ -135,7 +134,5 @@ fd3_context_create(struct pipe_screen *pscreen, void *priv)
 	fd3_ctx->solid_vbuf = create_solid_vertexbuf(pctx);
 	fd3_ctx->blit_texcoord_vbuf = create_blit_texcoord_vertexbuf(pctx);

-	fd3_query_context_init(pctx);
-
 	return pctx;
 }
--- a/src/gallium/drivers/freedreno/a3xx/fd3_emit.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_emit.c
@@ -195,10 +195,8 @@ emit_textures(struct fd_ringbuffer *ring,
 		OUT_RING(ring, CP_LOAD_STATE_1_STATE_TYPE(ST_CONSTANTS) |
 				CP_LOAD_STATE_1_EXT_SRC_ADDR(0));
 		for (i = 0; i < tex->num_textures; i++) {
-			static const struct fd3_pipe_sampler_view dummy_view = {};
-			const struct fd3_pipe_sampler_view *view = tex->textures[i] ?
-					fd3_pipe_sampler_view(tex->textures[i]) :
-					&dummy_view;
+			struct fd3_pipe_sampler_view *view =
+					fd3_pipe_sampler_view(tex->textures[i]);
 			OUT_RING(ring, view->texconst0);
 			OUT_RING(ring, view->texconst1);
 			OUT_RING(ring, view->texconst2 |
@@ -215,10 +213,8 @@ emit_textures(struct fd_ringbuffer *ring,
 		OUT_RING(ring, CP_LOAD_STATE_1_STATE_TYPE(ST_CONSTANTS) |
 				CP_LOAD_STATE_1_EXT_SRC_ADDR(0));
 		for (i = 0; i < tex->num_textures; i++) {
-			static const struct fd3_pipe_sampler_view dummy_view = {};
-			const struct fd3_pipe_sampler_view *view = tex->textures[i] ?
-					fd3_pipe_sampler_view(tex->textures[i]) :
-					&dummy_view;
+			struct fd3_pipe_sampler_view *view =
+					fd3_pipe_sampler_view(tex->textures[i]);
 			struct fd_resource *rsc = view->tex_resource;

 			for (j = 0; j < view->mipaddrs; j++) {
@@ -327,12 +323,9 @@ fd3_emit_vertex_bufs(struct fd_ringbuffer *ring,
 		if (vp->inputs[i].compmask) {
 			struct pipe_resource *prsc = vbufs[i].prsc;
 			struct fd_resource *rsc = fd_resource(prsc);
-			enum pipe_format pfmt = vbufs[i].format;
-			enum a3xx_vtx_fmt fmt = fd3_pipe2vtx(pfmt);
+			enum a3xx_vtx_fmt fmt = fd3_pipe2vtx(vbufs[i].format);
 			bool switchnext = (i != last);
-			uint32_t fs = util_format_get_blocksize(pfmt);
-
-			debug_assert(fmt != ~0);
+			uint32_t fs = util_format_get_blocksize(vbufs[i].format);

 			OUT_PKT0(ring, REG_A3XX_VFD_FETCH(j), 2);
 			OUT_RING(ring, A3XX_VFD_FETCH_INSTR_0_FETCHSIZE(fs - 1) |
@@ -346,7 +339,6 @@ fd3_emit_vertex_bufs(struct fd_ringbuffer *ring,
 			OUT_RING(ring, A3XX_VFD_DECODE_INSTR_CONSTFILL |
 					A3XX_VFD_DECODE_INSTR_WRITEMASK(vp->inputs[i].compmask) |
 					A3XX_VFD_DECODE_INSTR_FORMAT(fmt) |
-					A3XX_VFD_DECODE_INSTR_SWAP(fd3_pipe2swap(pfmt)) |
 					A3XX_VFD_DECODE_INSTR_REGID(vp->inputs[i].regid) |
 					A3XX_VFD_DECODE_INSTR_SHIFTCNT(fs) |
 					A3XX_VFD_DECODE_INSTR_LASTCOMPVALID |
--- a/src/gallium/drivers/freedreno/a3xx/fd3_gmem.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_gmem.c
@@ -82,7 +82,7 @@ emit_mrt(struct fd_ringbuffer *ring, unsigned nr_bufs,
 				stride = bin_w * rsc->cpp;

 				if (bases) {
-					base = bases[i];
+					base = bases[i] * rsc->cpp;
 				}
 			} else {
 				stride = slice->pitch * rsc->cpp;
@@ -106,17 +106,9 @@ emit_mrt(struct fd_ringbuffer *ring, unsigned nr_bufs,
 }

 static uint32_t
-depth_base(struct fd_context *ctx)
+depth_base(struct fd_gmem_stateobj *gmem)
 {
-	struct fd_gmem_stateobj *gmem = &ctx->gmem;
-	struct pipe_framebuffer_state *pfb = &ctx->framebuffer;
-	uint32_t cpp = 4;
-	if (pfb->cbufs[0]) {
-		struct fd_resource *rsc =
-				fd_resource(pfb->cbufs[0]->texture);
-		cpp = rsc->cpp;
-	}
-	return align(gmem->bin_w * gmem->bin_h * cpp, 0x4000);
+	return align(gmem->bin_w * gmem->bin_h, 0x4000);
 }

 static bool
@@ -164,7 +156,7 @@ emit_binning_workaround(struct fd_context *ctx)
 	OUT_RING(ring, A3XX_RB_COPY_CONTROL_MSAA_RESOLVE(MSAA_ONE) |
 			A3XX_RB_COPY_CONTROL_MODE(0) |
 			A3XX_RB_COPY_CONTROL_GMEM_BASE(0));
-	OUT_RELOCW(ring, fd_resource(fd3_ctx->solid_vbuf)->bo, 0x20, 0, -1);  /* RB_COPY_DEST_BASE */
+	OUT_RELOC(ring, fd_resource(fd3_ctx->solid_vbuf)->bo, 0x20, 0, -1);  /* RB_COPY_DEST_BASE */
 	OUT_RING(ring, A3XX_RB_COPY_DEST_PITCH_PITCH(128));
 	OUT_RING(ring, A3XX_RB_COPY_DEST_INFO_TILE(LINEAR) |
 			A3XX_RB_COPY_DEST_INFO_FORMAT(RB_R8G8B8A8_UNORM) |
@@ -407,7 +399,12 @@ fd3_emit_tile_gmem2mem(struct fd_context *ctx, struct fd_tile *tile)
 			}}, 1);

 	if (ctx->resolve & (FD_BUFFER_DEPTH | FD_BUFFER_STENCIL)) {
-		uint32_t base = depth_base(ctx);
+		uint32_t base = 0;
+		if (pfb->cbufs[0]) {
+			struct fd_resource *rsc =
+					fd_resource(pfb->cbufs[0]->texture);
+			base = depth_base(&ctx->gmem) * rsc->cpp;
+		}
 		emit_gmem2mem_surf(ctx, RB_COPY_DEPTH_STENCIL, base, pfb->zsbuf);
 	}

@@ -461,7 +458,7 @@ fd3_emit_tile_mem2gmem(struct fd_context *ctx, struct fd_tile *tile)
 	y1 = ((float)tile->yoff + bin_h) / ((float)pfb->height);

 	OUT_PKT3(ring, CP_MEM_WRITE, 5);
-	OUT_RELOCW(ring, fd_resource(fd3_ctx->blit_texcoord_vbuf)->bo, 0, 0, 0);
+	OUT_RELOC(ring, fd_resource(fd3_ctx->blit_texcoord_vbuf)->bo, 0, 0, 0);
 	OUT_RING(ring, fui(x0));
 	OUT_RING(ring, fui(y0));
 	OUT_RING(ring, fui(x1));
@@ -561,7 +558,7 @@ fd3_emit_tile_mem2gmem(struct fd_context *ctx, struct fd_tile *tile)
 	bin_h = gmem->bin_h;

 	if (ctx->restore & (FD_BUFFER_DEPTH | FD_BUFFER_STENCIL))
-		emit_mem2gmem_surf(ctx, depth_base(ctx), pfb->zsbuf, bin_w);
+		emit_mem2gmem_surf(ctx, depth_base(gmem), pfb->zsbuf, bin_w);

 	if (ctx->restore & FD_BUFFER_COLOR)
 		emit_mem2gmem_surf(ctx, 0, pfb->cbufs[0], bin_w);
@@ -642,7 +639,7 @@ update_vsc_pipe(struct fd_context *ctx)
 	int i;

 	OUT_PKT0(ring, REG_A3XX_VSC_SIZE_ADDRESS, 1);
-	OUT_RELOCW(ring, fd3_ctx->vsc_size_mem, 0, 0, 0); /* VSC_SIZE_ADDRESS */
+	OUT_RELOC(ring, fd3_ctx->vsc_size_mem, 0, 0, 0); /* VSC_SIZE_ADDRESS */

 	for (i = 0; i < 8; i++) {
 		struct fd_vsc_pipe *pipe = &ctx->pipe[i];
@@ -657,7 +654,7 @@ update_vsc_pipe(struct fd_context *ctx)
 				A3XX_VSC_PIPE_CONFIG_Y(pipe->y) |
 				A3XX_VSC_PIPE_CONFIG_W(pipe->w) |
 				A3XX_VSC_PIPE_CONFIG_H(pipe->h));
-		OUT_RELOCW(ring, pipe->bo, 0, 0, 0);       /* VSC_PIPE[i].DATA_ADDRESS */
+		OUT_RELOC(ring, pipe->bo, 0, 0, 0);        /* VSC_PIPE[i].DATA_ADDRESS */
 		OUT_RING(ring, fd_bo_size(pipe->bo) - 32); /* VSC_PIPE[i].DATA_LENGTH */
 	}
 }
@@ -792,7 +789,6 @@ fd3_emit_tile_init(struct fd_context *ctx)
 {
 	struct fd_ringbuffer *ring = ctx->ring;
 	struct fd_gmem_stateobj *gmem = &ctx->gmem;
-	uint32_t rb_render_control;

 	fd3_emit_restore(ctx);

@@ -817,10 +813,8 @@ fd3_emit_tile_init(struct fd_context *ctx)
 		patch_draws(ctx, IGNORE_VISIBILITY);
 	}

-	rb_render_control = A3XX_RB_RENDER_CONTROL_ENABLE_GMEM |
-			A3XX_RB_RENDER_CONTROL_BIN_WIDTH(gmem->bin_w);
-
-	patch_rbrc(ctx, rb_render_control);
+	patch_rbrc(ctx, A3XX_RB_RENDER_CONTROL_ENABLE_GMEM |
+			A3XX_RB_RENDER_CONTROL_BIN_WIDTH(gmem->bin_w));
 }

 /* before mem2gmem */
@@ -833,7 +827,7 @@ fd3_emit_tile_prep(struct fd_context *ctx, struct fd_tile *tile)
 	uint32_t reg;

 	OUT_PKT0(ring, REG_A3XX_RB_DEPTH_INFO, 2);
-	reg = A3XX_RB_DEPTH_INFO_DEPTH_BASE(depth_base(ctx));
+	reg = A3XX_RB_DEPTH_INFO_DEPTH_BASE(depth_base(gmem));
 	if (pfb->zsbuf) {
 		reg |= A3XX_RB_DEPTH_INFO_DEPTH_FORMAT(fd_pipe2depth(pfb->zsbuf->format));
 	}
--- a/src/gallium/drivers/freedreno/a3xx/fd3_program.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_program.c
@@ -406,7 +406,7 @@ fd3_program_emit(struct fd_ringbuffer *ring,
 			A3XX_SP_VS_PARAM_REG_PSIZEREGID(psize_regid) |
 			A3XX_SP_VS_PARAM_REG_TOTALVSOUTVAR(align(fp->total_in, 4) / 4));

-	for (i = 0, j = -1; (i < 8) && (j < (int)fp->inputs_count); i++) {
+	for (i = 0, j = -1; j < (int)fp->inputs_count; i++) {
 		uint32_t reg = 0;

 		OUT_PKT0(ring, REG_A3XX_SP_VS_OUT_REG(i), 1);
@@ -428,7 +428,7 @@ fd3_program_emit(struct fd_ringbuffer *ring,
 		OUT_RING(ring, reg);
 	}

-	for (i = 0, j = -1; (i < 4) && (j < (int)fp->inputs_count); i++) {
+	for (i = 0, j = -1; j < (int)fp->inputs_count; i++) {
 		uint32_t reg = 0;

 		OUT_PKT0(ring, REG_A3XX_SP_VS_VPC_DST_REG(i), 1);
--- a/src/gallium/drivers/freedreno/a3xx/fd3_program.h
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_program.h
@@ -91,7 +91,7 @@ struct fd3_shader_variant {
 	struct {
 		fd3_semantic semantic;
 		uint8_t regid;
-	} outputs[16 + 2];  /* +POSITION +PSIZE */
+	} outputs[16];
 	bool writes_pos, writes_psize;

 	/* vertices/inputs: */
@@ -104,7 +104,7 @@ struct fd3_shader_variant {
 		/* in theory inloc of fs should match outloc of vs: */
 		uint8_t inloc;
 		uint8_t bary;
-	} inputs[16 + 2];  /* +POSITION +FACE */
+	} inputs[16];

 	unsigned total_in;       /* sum of inputs (scalar) */

--- a/src/gallium/drivers/freedreno/a3xx/fd3_query.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_query.c
@@ -1,139 +0,0 @@
-/* -*- mode: C; c-file-style: "k&r"; tab-width 4; indent-tabs-mode: t; -*- */
-
-/*
- * Copyright (C) 2014 Rob Clark <robclark@freedesktop.org>
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the "Software"),
- * to deal in the Software without restriction, including without limitation
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
- * and/or sell copies of the Software, and to permit persons to whom the
- * Software is furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice (including the next
- * paragraph) shall be included in all copies or substantial portions of the
- * Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
- * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- *
- * Authors:
- *    Rob Clark <robclark@freedesktop.org>
- */
-
-#include "freedreno_query_hw.h"
-#include "freedreno_context.h"
-#include "freedreno_util.h"
-
-#include "fd3_query.h"
-#include "fd3_util.h"
-
-
-struct fd_rb_samp_ctrs {
-	uint64_t ctr[16];
-};
-
-/*
- * Occlusion Query:
- *
- * OCCLUSION_COUNTER and OCCLUSION_PREDICATE differ only in how they
- * interpret results
- */
-
-static struct fd_hw_sample *
-occlusion_get_sample(struct fd_context *ctx, struct fd_ringbuffer *ring)
-{
-	struct fd_hw_sample *samp =
-			fd_hw_sample_init(ctx, sizeof(struct fd_rb_samp_ctrs));
-
-	/* Set RB_SAMPLE_COUNT_ADDR to samp->offset plus value of
-	 * HW_QUERY_BASE_REG register:
-	 */
-	OUT_PKT3(ring, CP_SET_CONSTANT, 3);
-	OUT_RING(ring, CP_REG(REG_A3XX_RB_SAMPLE_COUNT_ADDR) | 0x80000000);
-	OUT_RING(ring, HW_QUERY_BASE_REG);
-	OUT_RING(ring, samp->offset);
-
-	OUT_PKT0(ring, REG_A3XX_RB_SAMPLE_COUNT_CONTROL, 1);
-	OUT_RING(ring, A3XX_RB_SAMPLE_COUNT_CONTROL_COPY);
-
-	OUT_PKT3(ring, CP_DRAW_INDX, 3);
-	OUT_RING(ring, 0x00000000);
-	OUT_RING(ring, DRAW(DI_PT_POINTLIST_A2XX, DI_SRC_SEL_AUTO_INDEX,
-			INDEX_SIZE_IGN, USE_VISIBILITY));
-	OUT_RING(ring, 0);             /* NumIndices */
-
-	OUT_PKT3(ring, CP_EVENT_WRITE, 1);
-	OUT_RING(ring, ZPASS_DONE);
-
-	OUT_PKT0(ring, REG_A3XX_RBBM_PERFCTR_CTL, 1);
-	OUT_RING(ring, A3XX_RBBM_PERFCTR_CTL_ENABLE);
-
-	OUT_PKT0(ring, REG_A3XX_VBIF_PERF_CNT_EN, 1);
-	OUT_RING(ring, A3XX_VBIF_PERF_CNT_EN_CNT0 |
-			A3XX_VBIF_PERF_CNT_EN_CNT1 |
-			A3XX_VBIF_PERF_CNT_EN_PWRCNT0 |
-			A3XX_VBIF_PERF_CNT_EN_PWRCNT1 |
-			A3XX_VBIF_PERF_CNT_EN_PWRCNT2);
-
-	return samp;
-}
-
-static uint64_t
-count_samples(const struct fd_rb_samp_ctrs *start,
-		const struct fd_rb_samp_ctrs *end)
-{
-	uint64_t n = 0;
-	unsigned i;
-
-	/* not quite sure what all of these are, possibly different
-	 * counters for each MRT render target:
-	 */
-	for (i = 0; i < 16; i += 4)
-		n += end->ctr[i] - start->ctr[i];
-
-	return n;
-}
-
-static void
-occlusion_counter_accumulate_result(struct fd_context *ctx,
-		const void *start, const void *end,
-		union pipe_query_result *result)
-{
-	uint64_t n = count_samples(start, end);
-	result->u64 += n;
-}
-
-static void
-occlusion_predicate_accumulate_result(struct fd_context *ctx,
-		const void *start, const void *end,
-		union pipe_query_result *result)
-{
-	uint64_t n = count_samples(start, end);
-	result->b |= (n > 0);
-}
-
-static const struct fd_hw_sample_provider occlusion_counter = {
-		.query_type = PIPE_QUERY_OCCLUSION_COUNTER,
-		.active = FD_STAGE_DRAW, /* | FD_STAGE_CLEAR ??? */
-		.get_sample = occlusion_get_sample,
-		.accumulate_result = occlusion_counter_accumulate_result,
-};
-
-static const struct fd_hw_sample_provider occlusion_predicate = {
-		.query_type = PIPE_QUERY_OCCLUSION_PREDICATE,
-		.active = FD_STAGE_DRAW, /* | FD_STAGE_CLEAR ??? */
-		.get_sample = occlusion_get_sample,
-		.accumulate_result = occlusion_predicate_accumulate_result,
-};
-
-void fd3_query_context_init(struct pipe_context *pctx)
-{
-	fd_hw_query_register_provider(pctx, &occlusion_counter);
-	fd_hw_query_register_provider(pctx, &occlusion_predicate);
-}
--- a/src/gallium/drivers/freedreno/a3xx/fd3_query.h
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_query.h
@@ -1,36 +0,0 @@
-/* -*- mode: C; c-file-style: "k&r"; tab-width 4; indent-tabs-mode: t; -*- */
-
-/*
- * Copyright (C) 2014 Rob Clark <robclark@freedesktop.org>
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the "Software"),
- * to deal in the Software without restriction, including without limitation
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
- * and/or sell copies of the Software, and to permit persons to whom the
- * Software is furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice (including the next
- * paragraph) shall be included in all copies or substantial portions of the
- * Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
- * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- *
- * Authors:
- *    Rob Clark <robclark@freedesktop.org>
- */
-
-#ifndef FD3_QUERY_H_
-#define FD3_QUERY_H_
-
-#include "pipe/p_context.h"
-
-void fd3_query_context_init(struct pipe_context *pctx);
-
-#endif /* FD3_QUERY_H_ */
--- a/src/gallium/drivers/freedreno/a3xx/fd3_rasterizer.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_rasterizer.c
@@ -40,7 +40,6 @@ fd3_rasterizer_state_create(struct pipe_context *pctx,
 		const struct pipe_rasterizer_state *cso)
 {
 	struct fd3_rasterizer_stateobj *so;
-	float psize_min, psize_max;

 	so = CALLOC_STRUCT(fd3_rasterizer_stateobj);
 	if (!so)
@@ -48,28 +47,19 @@ fd3_rasterizer_state_create(struct pipe_context *pctx,

 	so->base = *cso;

-	if (cso->point_size_per_vertex) {
-		psize_min = util_get_min_point_size(cso);
-		psize_max = 8192;
-	} else {
-		/* Force the point size to be as if the vertex output was disabled. */
-		psize_min = cso->point_size;
-		psize_max = cso->point_size;
-	}
-
 /*
 	if (cso->line_stipple_enable) {
 		??? TODO line stipple
 	}
 	TODO cso->half_pixel_center
+	TODO cso->point_size
+	TODO psize_min/psize_max
 	if (cso->multisample)
 		TODO
 */
 	so->gras_cl_clip_cntl = A3XX_GRAS_CL_CLIP_CNTL_IJ_PERSP_CENTER; /* ??? */
-	so->gras_su_point_minmax =
-			A3XX_GRAS_SU_POINT_MINMAX_MIN(psize_min/2) |
-			A3XX_GRAS_SU_POINT_MINMAX_MAX(psize_max/2);
-	so->gras_su_point_size   = A3XX_GRAS_SU_POINT_SIZE(cso->point_size/2);
+	so->gras_su_point_minmax = 0xffc00010;  /* ??? */
+	so->gras_su_point_size   = 0x00000008;  /* ??? */
 	so->gras_su_poly_offset_scale =
 			A3XX_GRAS_SU_POLY_OFFSET_SCALE_VAL(cso->offset_scale);
 	so->gras_su_poly_offset_offset =
--- a/src/gallium/drivers/freedreno/a3xx/fd3_texture.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_texture.c
@@ -30,7 +30,6 @@
 #include "util/u_string.h"
 #include "util/u_memory.h"
 #include "util/u_inlines.h"
-#include "util/u_format.h"

 #include "fd3_texture.h"
 #include "fd3_util.h"
@@ -48,14 +47,12 @@ tex_clamp(unsigned wrap)
 	case PIPE_TEX_WRAP_REPEAT:
 		return A3XX_TEX_REPEAT;
 	case PIPE_TEX_WRAP_CLAMP:
+	case PIPE_TEX_WRAP_CLAMP_TO_BORDER:
 	case PIPE_TEX_WRAP_CLAMP_TO_EDGE:
 		return A3XX_TEX_CLAMP_TO_EDGE;
-	case PIPE_TEX_WRAP_CLAMP_TO_BORDER:
-		return A3XX_TEX_CLAMP_TO_BORDER;
 	case PIPE_TEX_WRAP_MIRROR_CLAMP:
 	case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_BORDER:
 	case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_EDGE:
-		return A3XX_TEX_MIRROR_CLAMP;
 	case PIPE_TEX_WRAP_MIRROR_REPEAT:
 		return A3XX_TEX_MIRROR_REPEAT;
 	default:
@@ -102,9 +99,6 @@ fd3_sampler_state_create(struct pipe_context *pctx,
 			A3XX_TEX_SAMP_0_WRAP_T(tex_clamp(cso->wrap_t)) |
 			A3XX_TEX_SAMP_0_WRAP_R(tex_clamp(cso->wrap_r));

-	if (cso->compare_mode)
-		so->texsamp0 |= A3XX_TEX_SAMP_0_COMPARE_FUNC(cso->compare_func); /* maps 1:1 */
-
 	if (cso->min_mip_filter != PIPE_TEX_MIPFILTER_NONE) {
 		so->texsamp1 =
 				A3XX_TEX_SAMP_1_MIN_LOD(cso->min_lod) |
@@ -164,10 +158,6 @@ fd3_sampler_view_create(struct pipe_context *pctx, struct pipe_resource *prsc,
 			A3XX_TEX_CONST_0_MIPLVLS(miplevels) |
 			fd3_tex_swiz(cso->format, cso->swizzle_r, cso->swizzle_g,
 						cso->swizzle_b, cso->swizzle_a);
-
-	if (util_format_is_srgb(cso->format))
-		so->texconst0 |= A3XX_TEX_CONST_0_SRGB;
-
 	so->texconst1 =
 			A3XX_TEX_CONST_1_FETCHSIZE(fd3_pipe2fetchsize(cso->format)) |
 			A3XX_TEX_CONST_1_WIDTH(prsc->width0) |
--- a/src/gallium/drivers/freedreno/a3xx/fd3_util.c
+++ b/src/gallium/drivers/freedreno/a3xx/fd3_util.c
@@ -37,44 +37,70 @@ fd3_pipe2vtx(enum pipe_format format)
 {
 	switch (format) {
 	/* 8-bit buffers. */
+	case PIPE_FORMAT_A8_UNORM:
+	case PIPE_FORMAT_I8_UNORM:
+	case PIPE_FORMAT_L8_UNORM:
 	case PIPE_FORMAT_R8_UNORM:
+	case PIPE_FORMAT_L8_SRGB:
 		return VFMT_NORM_UBYTE_8;

+	case PIPE_FORMAT_A8_SNORM:
+	case PIPE_FORMAT_I8_SNORM:
+	case PIPE_FORMAT_L8_SNORM:
 	case PIPE_FORMAT_R8_SNORM:
 		return VFMT_NORM_BYTE_8;

+	case PIPE_FORMAT_A8_UINT:
+	case PIPE_FORMAT_I8_UINT:
+	case PIPE_FORMAT_L8_UINT:
 	case PIPE_FORMAT_R8_UINT:
 		return VFMT_UBYTE_8;

+	case PIPE_FORMAT_A8_SINT:
+	case PIPE_FORMAT_I8_SINT:
+	case PIPE_FORMAT_L8_SINT:
 	case PIPE_FORMAT_R8_SINT:
 		return VFMT_BYTE_8;

 	/* 16-bit buffers. */
 	case PIPE_FORMAT_R16_UNORM:
+	case PIPE_FORMAT_A16_UNORM:
+	case PIPE_FORMAT_L16_UNORM:
+	case PIPE_FORMAT_I16_UNORM:
 	case PIPE_FORMAT_Z16_UNORM:
 		return VFMT_NORM_USHORT_16;

 	case PIPE_FORMAT_R16_SNORM:
+	case PIPE_FORMAT_A16_SNORM:
+	case PIPE_FORMAT_L16_SNORM:
+	case PIPE_FORMAT_I16_SNORM:
 		return VFMT_NORM_SHORT_16;

 	case PIPE_FORMAT_R16_UINT:
+	case PIPE_FORMAT_A16_UINT:
+	case PIPE_FORMAT_L16_UINT:
+	case PIPE_FORMAT_I16_UINT:
 		return VFMT_USHORT_16;

 	case PIPE_FORMAT_R16_SINT:
+	case PIPE_FORMAT_A16_SINT:
+	case PIPE_FORMAT_L16_SINT:
+	case PIPE_FORMAT_I16_SINT:
 		return VFMT_SHORT_16;

-	case PIPE_FORMAT_R16_FLOAT:
-		return VFMT_FLOAT_16;
-
+	case PIPE_FORMAT_L8A8_UNORM:
 	case PIPE_FORMAT_R8G8_UNORM:
 		return VFMT_NORM_UBYTE_8_8;

+	case PIPE_FORMAT_L8A8_SNORM:
 	case PIPE_FORMAT_R8G8_SNORM:
 		return VFMT_NORM_BYTE_8_8;

+	case PIPE_FORMAT_L8A8_UINT:
 	case PIPE_FORMAT_R8G8_UINT:
 		return VFMT_UBYTE_8_8;

+	case PIPE_FORMAT_L8A8_SINT:
 	case PIPE_FORMAT_R8G8_SINT:
 		return VFMT_BYTE_8_8;

@@ -95,62 +121,42 @@ fd3_pipe2vtx(enum pipe_format format)
 	case PIPE_FORMAT_A8B8G8R8_UNORM:
 	case PIPE_FORMAT_A8R8G8B8_UNORM:
 	case PIPE_FORMAT_B8G8R8A8_UNORM:
+	case PIPE_FORMAT_B8G8R8X8_UNORM:
 	case PIPE_FORMAT_R8G8B8A8_UNORM:
+	case PIPE_FORMAT_R8G8B8X8_UNORM:
+	case PIPE_FORMAT_X8B8G8R8_UNORM:
+	case PIPE_FORMAT_X8R8G8B8_UNORM:
+	case PIPE_FORMAT_A8B8G8R8_SRGB:
+	case PIPE_FORMAT_B8G8R8A8_SRGB:
 		return VFMT_NORM_UBYTE_8_8_8_8;

 	case PIPE_FORMAT_R8G8B8A8_SNORM:
+	case PIPE_FORMAT_R8G8B8X8_SNORM:
 		return VFMT_NORM_BYTE_8_8_8_8;

 	case PIPE_FORMAT_R8G8B8A8_UINT:
+	case PIPE_FORMAT_R8G8B8X8_UINT:
 		return VFMT_UBYTE_8_8_8_8;

 	case PIPE_FORMAT_R8G8B8A8_SINT:
+	case PIPE_FORMAT_R8G8B8X8_SINT:
 		return VFMT_BYTE_8_8_8_8;

-	case PIPE_FORMAT_R16G16_SSCALED:
-		return VFMT_SHORT_16_16;
-
-	case PIPE_FORMAT_R16G16_FLOAT:
-		return VFMT_FLOAT_16_16;
-
-	case PIPE_FORMAT_R16G16_UINT:
-		return VFMT_USHORT_16_16;
-
-	case PIPE_FORMAT_R16G16_UNORM:
-		return VFMT_NORM_USHORT_16_16;
-
-	case PIPE_FORMAT_R16G16_SNORM:
-		return VFMT_NORM_SHORT_16_16;
-
-	case PIPE_FORMAT_R10G10B10A2_UNORM:
-		return VFMT_NORM_UINT_10_10_10_2;
-
-	case PIPE_FORMAT_R10G10B10A2_SNORM:
-		return VFMT_NORM_INT_10_10_10_2;
-
-	case PIPE_FORMAT_R10G10B10A2_USCALED:
-		return VFMT_UINT_10_10_10_2;
-
-	case PIPE_FORMAT_R10G10B10A2_SSCALED:
-		return VFMT_INT_10_10_10_2;
-
-	/* 48-bit buffers. */
-	case PIPE_FORMAT_R16G16B16_FLOAT:
-		return VFMT_FLOAT_16_16_16;
-
-	case PIPE_FORMAT_R16G16B16_SSCALED:
-		return VFMT_SHORT_16_16_16;
-
-	case PIPE_FORMAT_R16G16B16_UINT:
-		return VFMT_USHORT_16_16_16;
-
-	case PIPE_FORMAT_R16G16B16_SNORM:
-		return VFMT_NORM_SHORT_16_16_16;
-
-	case PIPE_FORMAT_R16G16B16_UNORM:
-		return VFMT_NORM_USHORT_16_16_16;
+/* TODO probably need gles3 blob drivers to find the 32bit int formats:
+	case PIPE_FORMAT_R32_UINT:
+	case PIPE_FORMAT_R32_SINT:
+	case PIPE_FORMAT_A32_UINT:
+	case PIPE_FORMAT_A32_SINT:
+	case PIPE_FORMAT_L32_UINT:
+	case PIPE_FORMAT_L32_SINT:
+	case PIPE_FORMAT_I32_UINT:
+	case PIPE_FORMAT_I32_SINT:
+*/

 	case PIPE_FORMAT_R32_FLOAT:
+	case PIPE_FORMAT_A32_FLOAT:
+	case PIPE_FORMAT_L32_FLOAT:
+	case PIPE_FORMAT_I32_FLOAT:
 	case PIPE_FORMAT_Z32_FLOAT:
 		return VFMT_FLOAT_32;

@@ -171,14 +177,23 @@ fd3_pipe2vtx(enum pipe_format format)
 		return VFMT_SHORT_16_16_16_16;

 	case PIPE_FORMAT_R32G32_FLOAT:
+	case PIPE_FORMAT_L32A32_FLOAT:
 		return VFMT_FLOAT_32_32;

 	case PIPE_FORMAT_R32G32_FIXED:
 		return VFMT_FIXED_32_32;

 	case PIPE_FORMAT_R16G16B16A16_FLOAT:
+	case PIPE_FORMAT_R16G16B16X16_FLOAT:
 		return VFMT_FLOAT_16_16_16_16;

+/* TODO probably need gles3 blob drivers to find the 32bit int formats:
+	case PIPE_FORMAT_R32G32_SINT:
+	case PIPE_FORMAT_R32G32_UINT:
+	case PIPE_FORMAT_L32A32_UINT:
+	case PIPE_FORMAT_L32A32_SINT:
+*/
+
 	/* 96-bit buffers. */
 	case PIPE_FORMAT_R32G32B32_FLOAT:
 		return VFMT_FLOAT_32_32_32;
@@ -188,6 +203,7 @@ fd3_pipe2vtx(enum pipe_format format)

 	/* 128-bit buffers. */
 	case PIPE_FORMAT_R32G32B32A32_FLOAT:
+	case PIPE_FORMAT_R32G32B32X32_FLOAT:
 		return VFMT_FLOAT_32_32_32_32;

 	case PIPE_FORMAT_R32G32B32A32_FIXED:
@@ -198,20 +214,6 @@ fd3_pipe2vtx(enum pipe_format format)
 	case PIPE_FORMAT_R32G32B32A32_UNORM:
 	case PIPE_FORMAT_R32G32B32A32_SINT:
 	case PIPE_FORMAT_R32G32B32A32_UINT:
-
-	case PIPE_FORMAT_R32_UINT:
-	case PIPE_FORMAT_R32_SINT:
-	case PIPE_FORMAT_A32_UINT:
-	case PIPE_FORMAT_A32_SINT:
-	case PIPE_FORMAT_L32_UINT:
-	case PIPE_FORMAT_L32_SINT:
-	case PIPE_FORMAT_I32_UINT:
-	case PIPE_FORMAT_I32_SINT:
-
-	case PIPE_FORMAT_R32G32_SINT:
-	case PIPE_FORMAT_R32G32_UINT:
-	case PIPE_FORMAT_L32A32_UINT:
-	case PIPE_FORMAT_L32A32_SINT:
 */

 	default:
@@ -233,10 +235,6 @@ fd3_pipe2tex(enum pipe_format format)
 	case PIPE_FORMAT_B8G8R8X8_UNORM:
 	case PIPE_FORMAT_R8G8B8A8_UNORM:
 	case PIPE_FORMAT_R8G8B8X8_UNORM:
-	case PIPE_FORMAT_B8G8R8A8_SRGB:
-	case PIPE_FORMAT_B8G8R8X8_SRGB:
-	case PIPE_FORMAT_R8G8B8A8_SRGB:
-	case PIPE_FORMAT_R8G8B8X8_SRGB:
 		return TFMT_NORM_UINT_8_8_8_8;

 	case PIPE_FORMAT_Z24X8_UNORM:
@@ -277,12 +275,6 @@ fd3_pipe2fetchsize(enum pipe_format format)

 	case PIPE_FORMAT_B8G8R8A8_UNORM:
 	case PIPE_FORMAT_B8G8R8X8_UNORM:
-	case PIPE_FORMAT_R8G8B8A8_UNORM:
-	case PIPE_FORMAT_R8G8B8X8_UNORM:
-	case PIPE_FORMAT_B8G8R8A8_SRGB:
-	case PIPE_FORMAT_B8G8R8X8_SRGB:
-	case PIPE_FORMAT_R8G8B8A8_SRGB:
-	case PIPE_FORMAT_R8G8B8X8_SRGB:
 	case PIPE_FORMAT_Z24X8_UNORM:
 	case PIPE_FORMAT_Z24_UNORM_S8_UINT:
 		return TFETCH_4_BYTE;
@@ -356,22 +348,8 @@ fd3_pipe2swap(enum pipe_format format)
 	switch (format) {
 	case PIPE_FORMAT_B8G8R8A8_UNORM:
 	case PIPE_FORMAT_B8G8R8X8_UNORM:
-	case PIPE_FORMAT_B8G8R8A8_SRGB:
-	case PIPE_FORMAT_B8G8R8X8_SRGB:
 		return WXYZ;

-	case PIPE_FORMAT_A8R8G8B8_UNORM:
-	case PIPE_FORMAT_X8R8G8B8_UNORM:
-	case PIPE_FORMAT_A8R8G8B8_SRGB:
-	case PIPE_FORMAT_X8R8G8B8_SRGB:
-		return ZYXW;
-
-	case PIPE_FORMAT_A8B8G8R8_UNORM:
-	case PIPE_FORMAT_X8B8G8R8_UNORM:
-	case PIPE_FORMAT_A8B8G8R8_SRGB:
-	case PIPE_FORMAT_X8B8G8R8_SRGB:
-		return XYZW;
-
 	case PIPE_FORMAT_R8G8B8A8_UNORM:
 	case PIPE_FORMAT_R8G8B8X8_UNORM:
 	case PIPE_FORMAT_Z24X8_UNORM:
@@ -401,14 +379,14 @@ fd3_tex_swiz(enum pipe_format format, unsigned swizzle_r, unsigned swizzle_g,
 {
 	const struct util_format_description *desc =
 			util_format_description(format);
-	unsigned char swiz[4] = {
+	uint8_t swiz[] = {
 			swizzle_r, swizzle_g, swizzle_b, swizzle_a,
-	}, rswiz[4];
+			PIPE_SWIZZLE_ZERO, PIPE_SWIZZLE_ONE,
+			PIPE_SWIZZLE_ONE, PIPE_SWIZZLE_ONE,
+	};

-	util_format_compose_swizzles(desc->swizzle, swiz, rswiz);
-
-	return A3XX_TEX_CONST_0_SWIZ_X(tex_swiz(rswiz[0])) |
-			A3XX_TEX_CONST_0_SWIZ_Y(tex_swiz(rswiz[1])) |
-			A3XX_TEX_CONST_0_SWIZ_Z(tex_swiz(rswiz[2])) |
-			A3XX_TEX_CONST_0_SWIZ_W(tex_swiz(rswiz[3]));
+	return A3XX_TEX_CONST_0_SWIZ_X(tex_swiz(swiz[desc->swizzle[0]])) |
+			A3XX_TEX_CONST_0_SWIZ_Y(tex_swiz(swiz[desc->swizzle[1]])) |
+			A3XX_TEX_CONST_0_SWIZ_Z(tex_swiz(swiz[desc->swizzle[2]])) |
+			A3XX_TEX_CONST_0_SWIZ_W(tex_swiz(swiz[desc->swizzle[3]]));
 }
--- a/src/gallium/drivers/freedreno/adreno_common.xml.h
+++ b/src/gallium/drivers/freedreno/adreno_common.xml.h
@@ -10,11 +10,11 @@ git clone https://github.com/freedreno/envytools.git
 The rules-ng-ng source files this header was generated from are:
 - /home/robclark/src/freedreno/envytools/rnndb/adreno.xml               (    364 bytes, from 2013-11-30 14:47:15)
 - /home/robclark/src/freedreno/envytools/rnndb/freedreno_copyright.xml  (   1453 bytes, from 2013-03-31 16:51:27)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a2xx.xml          (  32901 bytes, from 2014-06-02 15:21:30)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_common.xml (   9859 bytes, from 2014-06-02 15:21:30)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_pm4.xml    (  14477 bytes, from 2014-05-16 11:51:57)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a3xx.xml          (  58020 bytes, from 2014-06-13 17:29:47)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a4xx.xml          (  26602 bytes, from 2014-06-13 17:28:10)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a2xx.xml          (  32840 bytes, from 2014-01-05 14:44:21)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_common.xml (   9009 bytes, from 2014-01-11 16:56:35)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_pm4.xml    (  12362 bytes, from 2014-01-07 14:47:36)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a3xx.xml          (  56545 bytes, from 2014-02-26 16:32:11)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a4xx.xml          (   8344 bytes, from 2013-11-30 14:49:47)

 Copyright (C) 2013-2014 by the following authors:
 - Rob Clark <robdclark@gmail.com> (robclark)
@@ -87,6 +87,15 @@ enum adreno_rb_blend_factor {
 	FACTOR_SRC_ALPHA_SATURATE = 16,
 };

+enum adreno_rb_blend_opcode {
+	BLEND_DST_PLUS_SRC = 0,
+	BLEND_SRC_MINUS_DST = 1,
+	BLEND_MIN_DST_SRC = 2,
+	BLEND_MAX_DST_SRC = 3,
+	BLEND_DST_MINUS_SRC = 4,
+	BLEND_DST_PLUS_SRC_BIAS = 5,
+};
+
 enum adreno_rb_surface_endian {
 	ENDIAN_NONE = 0,
 	ENDIAN_8IN16 = 1,
@@ -107,39 +116,6 @@ enum adreno_rb_depth_format {
 	DEPTHX_24_8 = 1,
 };

-enum adreno_rb_copy_control_mode {
-	RB_COPY_RESOLVE = 1,
-	RB_COPY_CLEAR = 2,
-	RB_COPY_DEPTH_STENCIL = 5,
-};
-
-enum a3xx_render_mode {
-	RB_RENDERING_PASS = 0,
-	RB_TILING_PASS = 1,
-	RB_RESOLVE_PASS = 2,
-	RB_COMPUTE_PASS = 3,
-};
-
-enum a3xx_msaa_samples {
-	MSAA_ONE = 0,
-	MSAA_TWO = 1,
-	MSAA_FOUR = 2,
-};
-
-enum a3xx_threadmode {
-	MULTI = 0,
-	SINGLE = 1,
-};
-
-enum a3xx_instrbuffermode {
-	BUFFER = 1,
-};
-
-enum a3xx_threadsize {
-	TWO_QUADS = 0,
-	FOUR_QUADS = 1,
-};
-
 #define REG_AXXX_CP_RB_BASE					0x000001c0

 #define REG_AXXX_CP_RB_CNTL					0x000001c1
--- a/src/gallium/drivers/freedreno/adreno_pm4.xml.h
+++ b/src/gallium/drivers/freedreno/adreno_pm4.xml.h
@@ -10,11 +10,11 @@ git clone https://github.com/freedreno/envytools.git
 The rules-ng-ng source files this header was generated from are:
 - /home/robclark/src/freedreno/envytools/rnndb/adreno.xml               (    364 bytes, from 2013-11-30 14:47:15)
 - /home/robclark/src/freedreno/envytools/rnndb/freedreno_copyright.xml  (   1453 bytes, from 2013-03-31 16:51:27)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a2xx.xml          (  32901 bytes, from 2014-06-02 15:21:30)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_common.xml (   9859 bytes, from 2014-06-02 15:21:30)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_pm4.xml    (  14477 bytes, from 2014-05-16 11:51:57)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a3xx.xml          (  58020 bytes, from 2014-06-13 17:29:47)
- /home/robclark/src/freedreno/envytools/rnndb/adreno/a4xx.xml          (  26602 bytes, from 2014-06-13 17:28:10)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a2xx.xml          (  32840 bytes, from 2014-01-05 14:44:21)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_common.xml (   9009 bytes, from 2014-01-11 16:56:35)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/adreno_pm4.xml    (  12362 bytes, from 2014-01-07 14:47:36)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a3xx.xml          (  56545 bytes, from 2014-02-26 16:32:11)
+- /home/robclark/src/freedreno/envytools/rnndb/adreno/a4xx.xml          (   8344 bytes, from 2013-11-30 14:49:47)

 Copyright (C) 2013-2014 by the following authors:
 - Rob Clark <robdclark@gmail.com> (robclark)
@@ -164,11 +164,6 @@ enum adreno_pm4_type3_packets {
 	CP_SET_BIN = 76,
 	CP_TEST_TWO_MEMS = 113,
 	CP_WAIT_FOR_ME = 19,
-	CP_SET_DRAW_STATE = 67,
-	CP_DRAW_INDX_OFFSET = 56,
-	CP_DRAW_INDIRECT = 40,
-	CP_DRAW_INDX_INDIRECT = 41,
-	CP_DRAW_AUTO = 36,
 	IN_IB_PREFETCH_END = 23,
 	IN_SUBBLK_PREFETCH = 31,
 	IN_INSTR_PREFETCH = 32,
@@ -356,93 +351,6 @@ static inline uint32_t CP_DRAW_INDX_2_2_NUM_INDICES(uint32_t val)
 	return ((val) << CP_DRAW_INDX_2_2_NUM_INDICES__SHIFT) & CP_DRAW_INDX_2_2_NUM_INDICES__MASK;
 }

-#define REG_CP_DRAW_INDX_OFFSET_0				0x00000000
-#define CP_DRAW_INDX_OFFSET_0_PRIM_TYPE__MASK			0x0000003f
-#define CP_DRAW_INDX_OFFSET_0_PRIM_TYPE__SHIFT			0
-static inline uint32_t CP_DRAW_INDX_OFFSET_0_PRIM_TYPE(enum pc_di_primtype val)
-{
-	return ((val) << CP_DRAW_INDX_OFFSET_0_PRIM_TYPE__SHIFT) & CP_DRAW_INDX_OFFSET_0_PRIM_TYPE__MASK;
-}
-#define CP_DRAW_INDX_OFFSET_0_SOURCE_SELECT__MASK		0x000000c0
-#define CP_DRAW_INDX_OFFSET_0_SOURCE_SELECT__SHIFT		6
-static inline uint32_t CP_DRAW_INDX_OFFSET_0_SOURCE_SELECT(enum pc_di_src_sel val)
-{
-	return ((val) << CP_DRAW_INDX_OFFSET_0_SOURCE_SELECT__SHIFT) & CP_DRAW_INDX_OFFSET_0_SOURCE_SELECT__MASK;
-}
-#define CP_DRAW_INDX_OFFSET_0_VIS_CULL__MASK			0x00000700
-#define CP_DRAW_INDX_OFFSET_0_VIS_CULL__SHIFT			8
-static inline uint32_t CP_DRAW_INDX_OFFSET_0_VIS_CULL(enum pc_di_vis_cull_mode val)
-{
-	return ((val) << CP_DRAW_INDX_OFFSET_0_VIS_CULL__SHIFT) & CP_DRAW_INDX_OFFSET_0_VIS_CULL__MASK;
-}
-#define CP_DRAW_INDX_OFFSET_0_INDEX_SIZE__MASK			0x00000800
-#define CP_DRAW_INDX_OFFSET_0_INDEX_SIZE__SHIFT			11
-static inline uint32_t CP_DRAW_INDX_OFFSET_0_INDEX_SIZE(enum pc_di_index_size val)
-{
-	return ((val) << CP_DRAW_INDX_OFFSET_0_INDEX_SIZE__SHIFT) & CP_DRAW_INDX_OFFSET_0_INDEX_SIZE__MASK;
-}
-#define CP_DRAW_INDX_OFFSET_0_NOT_EOP				0x00001000
-#define CP_DRAW_INDX_OFFSET_0_SMALL_INDEX			0x00002000
-#define CP_DRAW_INDX_OFFSET_0_PRE_DRAW_INITIATOR_ENABLE		0x00004000
-#define CP_DRAW_INDX_OFFSET_0_NUM_INDICES__MASK			0xffff0000
-#define CP_DRAW_INDX_OFFSET_0_NUM_INDICES__SHIFT		16
-static inline uint32_t CP_DRAW_INDX_OFFSET_0_NUM_INDICES(uint32_t val)
-{
-	return ((val) << CP_DRAW_INDX_OFFSET_0_NUM_INDICES__SHIFT) & CP_DRAW_INDX_OFFSET_0_NUM_INDICES__MASK;
-}
-
-#define REG_CP_DRAW_INDX_OFFSET_1				0x00000001
-
-#define REG_CP_DRAW_INDX_OFFSET_2				0x00000002
-#define CP_DRAW_INDX_OFFSET_2_NUM_INDICES__MASK			0xffffffff
-#define CP_DRAW_INDX_OFFSET_2_NUM_INDICES__SHIFT		0
-static inline uint32_t CP_DRAW_INDX_OFFSET_2_NUM_INDICES(uint32_t val)
-{
-	return ((val) << CP_DRAW_INDX_OFFSET_2_NUM_INDICES__SHIFT) & CP_DRAW_INDX_OFFSET_2_NUM_INDICES__MASK;
-}
-
-#define REG_CP_DRAW_INDX_OFFSET_2				0x00000002
-#define CP_DRAW_INDX_OFFSET_2_INDX_BASE__MASK			0xffffffff
-#define CP_DRAW_INDX_OFFSET_2_INDX_BASE__SHIFT			0
-static inline uint32_t CP_DRAW_INDX_OFFSET_2_INDX_BASE(uint32_t val)
-{
-	return ((val) << CP_DRAW_INDX_OFFSET_2_INDX_BASE__SHIFT) & CP_DRAW_INDX_OFFSET_2_INDX_BASE__MASK;
-}
-
-#define REG_CP_DRAW_INDX_OFFSET_2				0x00000002
-#define CP_DRAW_INDX_OFFSET_2_INDX_SIZE__MASK			0xffffffff
-#define CP_DRAW_INDX_OFFSET_2_INDX_SIZE__SHIFT			0
-static inline uint32_t CP_DRAW_INDX_OFFSET_2_INDX_SIZE(uint32_t val)
-{
-	return ((val) << CP_DRAW_INDX_OFFSET_2_INDX_SIZE__SHIFT) & CP_DRAW_INDX_OFFSET_2_INDX_SIZE__MASK;
-}
-
-#define REG_CP_SET_DRAW_STATE_0					0x00000000
-#define CP_SET_DRAW_STATE_0_COUNT__MASK				0x0000ffff
-#define CP_SET_DRAW_STATE_0_COUNT__SHIFT			0
-static inline uint32_t CP_SET_DRAW_STATE_0_COUNT(uint32_t val)
-{
-	return ((val) << CP_SET_DRAW_STATE_0_COUNT__SHIFT) & CP_SET_DRAW_STATE_0_COUNT__MASK;
-}
-#define CP_SET_DRAW_STATE_0_DIRTY				0x00010000
-#define CP_SET_DRAW_STATE_0_DISABLE				0x00020000
-#define CP_SET_DRAW_STATE_0_DISABLE_ALL_GROUPS			0x00040000
-#define CP_SET_DRAW_STATE_0_LOAD_IMMED				0x00080000
-#define CP_SET_DRAW_STATE_0_GROUP_ID__MASK			0x1f000000
-#define CP_SET_DRAW_STATE_0_GROUP_ID__SHIFT			24
-static inline uint32_t CP_SET_DRAW_STATE_0_GROUP_ID(uint32_t val)
-{
-	return ((val) << CP_SET_DRAW_STATE_0_GROUP_ID__SHIFT) & CP_SET_DRAW_STATE_0_GROUP_ID__MASK;
-}
-
-#define REG_CP_SET_DRAW_STATE_1					0x00000001
-#define CP_SET_DRAW_STATE_1_ADDR__MASK				0xffffffff
-#define CP_SET_DRAW_STATE_1_ADDR__SHIFT				0
-static inline uint32_t CP_SET_DRAW_STATE_1_ADDR(uint32_t val)
-{
-	return ((val) << CP_SET_DRAW_STATE_1_ADDR__SHIFT) & CP_SET_DRAW_STATE_1_ADDR__MASK;
-}
-
 #define REG_CP_SET_BIN_0					0x00000000

 #define REG_CP_SET_BIN_1					0x00000001
--- a/src/gallium/drivers/freedreno/freedreno_context.c
+++ b/src/gallium/drivers/freedreno/freedreno_context.c
@@ -34,7 +34,6 @@
 #include "freedreno_state.h"
 #include "freedreno_gmem.h"
 #include "freedreno_query.h"
-#include "freedreno_query_hw.h"
 #include "freedreno_util.h"

 static struct fd_ringbuffer *next_rb(struct fd_context *ctx)
@@ -146,7 +145,6 @@ fd_context_destroy(struct pipe_context *pctx)
 	DBG("");

 	fd_prog_fini(pctx);
-	fd_hw_query_fini(pctx);

 	util_slab_destroy(&ctx->transfer_pool);

@@ -223,7 +221,6 @@ fd_context_init(struct fd_context *ctx, struct pipe_screen *pscreen,
 	fd_query_context_init(pctx);
 	fd_texture_init(pctx);
 	fd_state_init(pctx);
-	fd_hw_query_init(pctx);

 	ctx->blitter = util_blitter_create(pctx);
 	if (!ctx->blitter)
--- a/src/gallium/drivers/freedreno/freedreno_context.h
+++ b/src/gallium/drivers/freedreno/freedreno_context.h
@@ -33,7 +33,6 @@
 #include "pipe/p_context.h"
 #include "indices/u_primconvert.h"
 #include "util/u_blitter.h"
-#include "util/u_double_list.h"
 #include "util/u_slab.h"
 #include "util/u_string.h"

@@ -83,80 +82,16 @@ struct fd_vertex_stateobj {
 	unsigned num_elements;
 };

-/* Bitmask of stages in rendering that a particular query query is
- * active.  Queries will be automatically started/stopped (generating
- * additional fd_hw_sample_period's) on entrance/exit from stages that
- * are applicable to the query.
- *
- * NOTE: set the stage to NULL at end of IB to ensure no query is still
- * active.  Things aren't going to work out the way you want if a query
- * is active across IB's (or between tile IB and draw IB)
- */
-enum fd_render_stage {
-	FD_STAGE_NULL     = 0x00,
-	FD_STAGE_DRAW     = 0x01,
-	FD_STAGE_CLEAR    = 0x02,
-	/* TODO before queries which include MEM2GMEM or GMEM2MEM will
-	 * work we will need to call fd_hw_query_prepare() from somewhere
-	 * appropriate so that queries in the tiling IB get backed with
-	 * memory to write results to.
-	 */
-	FD_STAGE_MEM2GMEM = 0x04,
-	FD_STAGE_GMEM2MEM = 0x08,
-	/* used for driver internal draws (ie. util_blitter_blit()): */
-	FD_STAGE_BLIT     = 0x10,
-};
-
-#define MAX_HW_SAMPLE_PROVIDERS 4
-struct fd_hw_sample_provider;
-struct fd_hw_sample;
-
 struct fd_context {
 	struct pipe_context base;

 	struct fd_device *dev;
 	struct fd_screen *screen;
-
 	struct blitter_context *blitter;
 	struct primconvert_context *primconvert;

-	/* slab for pipe_transfer allocations: */
 	struct util_slab_mempool transfer_pool;

-	/* slabs for fd_hw_sample and fd_hw_sample_period allocations: */
-	struct util_slab_mempool sample_pool;
-	struct util_slab_mempool sample_period_pool;
-
-	/* next sample offset.. incremented for each sample in the batch/
-	 * submit, reset to zero on next submit.
-	 */
-	uint32_t next_sample_offset;
-
-	/* sample-providers for hw queries: */
-	const struct fd_hw_sample_provider *sample_providers[MAX_HW_SAMPLE_PROVIDERS];
-
-	/* cached samples (in case multiple queries need to reference
-	 * the same sample snapshot)
-	 */
-	struct fd_hw_sample *sample_cache[MAX_HW_SAMPLE_PROVIDERS];
-
-	/* tracking for current stage, to know when to start/stop
-	 * any active queries:
-	 */
-	enum fd_render_stage stage;
-
-	/* list of active queries: */
-	struct list_head active_queries;
-
-	/* list of queries that are not active, but were active in the
-	 * current submit:
-	 */
-	struct list_head current_queries;
-
-	/* current query result bo and tile stride: */
-	struct fd_bo *query_bo;
-	uint32_t query_tile_stride;
-
 	/* table with PIPE_PRIM_MAX entries mapping PIPE_PRIM_x to
 	 * DI_PT_x value to use for draw initiator.  There are some
 	 * slight differences between generation:
--- a/src/gallium/drivers/freedreno/freedreno_draw.c
+++ b/src/gallium/drivers/freedreno/freedreno_draw.c
@@ -36,7 +36,6 @@
 #include "freedreno_context.h"
 #include "freedreno_state.h"
 #include "freedreno_resource.h"
-#include "freedreno_query_hw.h"
 #include "freedreno_util.h"


@@ -71,7 +70,7 @@ fd_draw_emit(struct fd_context *ctx, struct fd_ringbuffer *ring,
 		idx_bo = fd_resource(idx->buffer)->bo;
 		idx_type = size2indextype(idx->index_size);
 		idx_size = idx->index_size * info->count;
-		idx_offset = idx->offset + (info->start * idx->index_size);
+		idx_offset = idx->offset;
 		src_sel = DI_SRC_SEL_DMA;
 	} else {
 		idx_bo = NULL;
@@ -157,7 +156,6 @@ fd_draw_vbo(struct pipe_context *pctx, const struct pipe_draw_info *info)
 	/* and any buffers used, need to be resolved: */
 	ctx->resolve |= buffers;

-	fd_hw_query_set_stage(ctx, ctx->ring, FD_STAGE_DRAW);
 	ctx->draw(ctx, info);
 }

@@ -190,8 +188,6 @@ fd_clear(struct pipe_context *pctx, unsigned buffers,
 		util_format_short_name(pipe_surface_format(pfb->cbufs[0])),
 		util_format_short_name(pipe_surface_format(pfb->zsbuf)));

-	fd_hw_query_set_stage(ctx, ctx->ring, FD_STAGE_CLEAR);
-
 	ctx->clear(ctx, buffers, color, depth, stencil);

 	ctx->dirty |= FD_DIRTY_ZSA |
--- a/src/gallium/drivers/freedreno/freedreno_gmem.c
+++ b/src/gallium/drivers/freedreno/freedreno_gmem.c
@@ -35,7 +35,6 @@
 #include "freedreno_gmem.h"
 #include "freedreno_context.h"
 #include "freedreno_resource.h"
-#include "freedreno_query_hw.h"
 #include "freedreno_util.h"

 /*
@@ -274,24 +273,17 @@ render_tiles(struct fd_context *ctx)

 		ctx->emit_tile_prep(ctx, tile);

-		if (ctx->restore) {
-			fd_hw_query_set_stage(ctx, ctx->ring, FD_STAGE_MEM2GMEM);
+		if (ctx->restore)
 			ctx->emit_tile_mem2gmem(ctx, tile);
-			fd_hw_query_set_stage(ctx, ctx->ring, FD_STAGE_NULL);
-		}

 		ctx->emit_tile_renderprep(ctx, tile);

-		fd_hw_query_prepare_tile(ctx, i, ctx->ring);
-
 		/* emit IB to drawcmds: */
 		OUT_IB(ctx->ring, ctx->draw_start, ctx->draw_end);
 		fd_reset_wfi(ctx);

 		/* emit gmem2mem to transfer tile back to system memory: */
-		fd_hw_query_set_stage(ctx, ctx->ring, FD_STAGE_GMEM2MEM);
 		ctx->emit_tile_gmem2mem(ctx, tile);
-		fd_hw_query_set_stage(ctx, ctx->ring, FD_STAGE_NULL);
 	}
 }

@@ -300,8 +292,6 @@ render_sysmem(struct fd_context *ctx)
 {
 	ctx->emit_sysmem_prep(ctx);

-	fd_hw_query_prepare_tile(ctx, 0, ctx->ring);
-
 	/* emit IB to drawcmds: */
 	OUT_IB(ctx->ring, ctx->draw_start, ctx->draw_end);
 	fd_reset_wfi(ctx);
@@ -324,11 +314,6 @@ fd_gmem_render_tiles(struct pipe_context *pctx)
 		}
 	}

-	/* close out the draw cmds by making sure any active queries are
-	 * paused:
-	 */
-	fd_hw_query_set_stage(ctx, ctx->ring, FD_STAGE_NULL);
-
 	/* mark the end of the clear/draw cmds before emitting per-tile cmds: */
 	fd_ringmarker_mark(ctx->draw_end);
 	fd_ringmarker_mark(ctx->binning_end);
@@ -341,7 +326,6 @@ fd_gmem_render_tiles(struct pipe_context *pctx)
 		DBG("rendering sysmem (%s/%s)",
 			util_format_short_name(pipe_surface_format(pfb->cbufs[0])),
 			util_format_short_name(pipe_surface_format(pfb->zsbuf)));
-		fd_hw_query_prepare(ctx, 1);
 		render_sysmem(ctx);
 		ctx->stats.batch_sysmem++;
 	} else {
@@ -350,7 +334,6 @@ fd_gmem_render_tiles(struct pipe_context *pctx)
 		DBG("rendering %dx%d tiles (%s/%s)", gmem->nbins_x, gmem->nbins_y,
 			util_format_short_name(pipe_surface_format(pfb->cbufs[0])),
 			util_format_short_name(pipe_surface_format(pfb->zsbuf)));
-		fd_hw_query_prepare(ctx, gmem->nbins_x * gmem->nbins_y);
 		render_tiles(ctx);
 		ctx->stats.batch_gmem++;
 	}
--- a/src/gallium/drivers/freedreno/freedreno_query.c
+++ b/src/gallium/drivers/freedreno/freedreno_query.c
@@ -1,7 +1,7 @@
 /* -*- mode: C; c-file-style: "k&r"; ttxab-width 4; indent-tabs-mode: t; -*- */

 /*
- * Copyright (C) 2013 Rob Clark <robclark@freedesktop.org>
+ * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
@@ -27,27 +27,63 @@
 */

 #include "pipe/p_state.h"
+#include "util/u_string.h"
 #include "util/u_memory.h"
+#include "util/u_inlines.h"
+#include "os/os_time.h"

 #include "freedreno_query.h"
-#include "freedreno_query_sw.h"
-#include "freedreno_query_hw.h"
 #include "freedreno_context.h"
 #include "freedreno_util.h"

-/*
- * Pipe Query interface:
+#define FD_QUERY_DRAW_CALLS      (PIPE_QUERY_DRIVER_SPECIFIC + 0)
+#define FD_QUERY_BATCH_TOTAL     (PIPE_QUERY_DRIVER_SPECIFIC + 1)  /* total # of batches (submits) */
+#define FD_QUERY_BATCH_SYSMEM    (PIPE_QUERY_DRIVER_SPECIFIC + 2)  /* batches using system memory (GMEM bypass) */
+#define FD_QUERY_BATCH_GMEM      (PIPE_QUERY_DRIVER_SPECIFIC + 3)  /* batches using GMEM */
+#define FD_QUERY_BATCH_RESTORE   (PIPE_QUERY_DRIVER_SPECIFIC + 4)  /* batches requiring GMEM restore */
+
+/* Currently just simple cpu query's supported.. probably need
+ * to refactor this a bit when I'm eventually ready to add gpu
+ * queries:
 */
+struct fd_query {
+	int type;
+	/* storage for the collected data */
+	union pipe_query_result data;
+	bool active;
+	uint64_t begin_value, end_value;
+	uint64_t begin_time, end_time;
+};
+
+static inline struct fd_query *
+fd_query(struct pipe_query *pq)
+{
+	return (struct fd_query *)pq;
+}

 static struct pipe_query *
 fd_create_query(struct pipe_context *pctx, unsigned query_type)
 {
-	struct fd_context *ctx = fd_context(pctx);
 	struct fd_query *q;

-	q = fd_sw_create_query(ctx, query_type);
+	switch (query_type) {
+	case PIPE_QUERY_PRIMITIVES_GENERATED:
+	case PIPE_QUERY_PRIMITIVES_EMITTED:
+	case FD_QUERY_DRAW_CALLS:
+	case FD_QUERY_BATCH_TOTAL:
+	case FD_QUERY_BATCH_SYSMEM:
+	case FD_QUERY_BATCH_GMEM:
+	case FD_QUERY_BATCH_RESTORE:
+		break;
+	default:
+		return NULL;
+	}
+
+	q = CALLOC_STRUCT(fd_query);
 	if (!q)
-		q = fd_hw_create_query(ctx, query_type);
+		return NULL;
+
+	q->type = query_type;

 	return (struct pipe_query *) q;
 }
@@ -56,21 +92,64 @@ static void
 fd_destroy_query(struct pipe_context *pctx, struct pipe_query *pq)
 {
 	struct fd_query *q = fd_query(pq);
-	q->funcs->destroy_query(fd_context(pctx), q);
+	free(q);
+}
+
+static uint64_t
+read_counter(struct pipe_context *pctx, int type)
+{
+	struct fd_context *ctx = fd_context(pctx);
+	switch (type) {
+	case PIPE_QUERY_PRIMITIVES_GENERATED:
+		/* for now same thing as _PRIMITIVES_EMITTED */
+	case PIPE_QUERY_PRIMITIVES_EMITTED:
+		return ctx->stats.prims_emitted;
+	case FD_QUERY_DRAW_CALLS:
+		return ctx->stats.draw_calls;
+	case FD_QUERY_BATCH_TOTAL:
+		return ctx->stats.batch_total;
+	case FD_QUERY_BATCH_SYSMEM:
+		return ctx->stats.batch_sysmem;
+	case FD_QUERY_BATCH_GMEM:
+		return ctx->stats.batch_gmem;
+	case FD_QUERY_BATCH_RESTORE:
+		return ctx->stats.batch_restore;
+	}
+	return 0;
+}
+
+static bool
+is_rate_query(struct fd_query *q)
+{
+	switch (q->type) {
+	case FD_QUERY_BATCH_TOTAL:
+	case FD_QUERY_BATCH_SYSMEM:
+	case FD_QUERY_BATCH_GMEM:
+	case FD_QUERY_BATCH_RESTORE:
+		return true;
+	default:
+		return false;
+	}
 }

 static void
 fd_begin_query(struct pipe_context *pctx, struct pipe_query *pq)
 {
 	struct fd_query *q = fd_query(pq);
-	q->funcs->begin_query(fd_context(pctx), q);
+	q->active = true;
+	q->begin_value = read_counter(pctx, q->type);
+	if (is_rate_query(q))
+		q->begin_time = os_time_get();
 }

 static void
 fd_end_query(struct pipe_context *pctx, struct pipe_query *pq)
 {
 	struct fd_query *q = fd_query(pq);
-	q->funcs->end_query(fd_context(pctx), q);
+	q->active = false;
+	q->end_value = read_counter(pctx, q->type);
+	if (is_rate_query(q))
+		q->end_time = os_time_get();
 }

 static boolean
@@ -78,7 +157,21 @@ fd_get_query_result(struct pipe_context *pctx, struct pipe_query *pq,
 		boolean wait, union pipe_query_result *result)
 {
 	struct fd_query *q = fd_query(pq);
-	return q->funcs->get_query_result(fd_context(pctx), q, wait, result);
+
+	if (q->active)
+		return false;
+
+	util_query_clear_result(result, q->type);
+
+	result->u64 = q->end_value - q->begin_value;
+
+	if (is_rate_query(q)) {
+		double fps = (result->u64 * 1000000) /
+				(double)(q->end_time - q->begin_time);
+		result->u64 = (uint64_t)fps;
+	}
+
+	return true;
 }

 static int
--- a/src/gallium/drivers/freedreno/freedreno_query.h
+++ b/src/gallium/drivers/freedreno/freedreno_query.h
@@ -1,7 +1,7 @@
 /* -*- mode: C; c-file-style: "k&r"; tab-width 4; indent-tabs-mode: t; -*- */

 /*
- * Copyright (C) 2013 Rob Clark <robclark@freedesktop.org>
+ * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
@@ -31,37 +31,6 @@

 #include "pipe/p_context.h"

-struct fd_context;
-struct fd_query;
-
-struct fd_query_funcs {
-	void (*destroy_query)(struct fd_context *ctx,
-			struct fd_query *q);
-	void (*begin_query)(struct fd_context *ctx, struct fd_query *q);
-	void (*end_query)(struct fd_context *ctx, struct fd_query *q);
-	boolean (*get_query_result)(struct fd_context *ctx,
-			struct fd_query *q, boolean wait,
-			union pipe_query_result *result);
-};
-
-struct fd_query {
-	const struct fd_query_funcs *funcs;
-	bool active;
-	int type;
-};
-
-static inline struct fd_query *
-fd_query(struct pipe_query *pq)
-{
-	return (struct fd_query *)pq;
-}
-
-#define FD_QUERY_DRAW_CALLS      (PIPE_QUERY_DRIVER_SPECIFIC + 0)
-#define FD_QUERY_BATCH_TOTAL     (PIPE_QUERY_DRIVER_SPECIFIC + 1)  /* total # of batches (submits) */
-#define FD_QUERY_BATCH_SYSMEM    (PIPE_QUERY_DRIVER_SPECIFIC + 2)  /* batches using system memory (GMEM bypass) */
-#define FD_QUERY_BATCH_GMEM      (PIPE_QUERY_DRIVER_SPECIFIC + 3)  /* batches using GMEM */
-#define FD_QUERY_BATCH_RESTORE   (PIPE_QUERY_DRIVER_SPECIFIC + 4)  /* batches requiring GMEM restore */
-
 void fd_query_screen_init(struct pipe_screen *pscreen);
 void fd_query_context_init(struct pipe_context *pctx);

--- a/src/gallium/drivers/freedreno/freedreno_query_hw.c
+++ b/src/gallium/drivers/freedreno/freedreno_query_hw.c
@@ -1,465 +0,0 @@
-/* -*- mode: C; c-file-style: "k&r"; tab-width 4; indent-tabs-mode: t; -*- */
-
-/*
- * Copyright (C) 2014 Rob Clark <robclark@freedesktop.org>
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the "Software"),
- * to deal in the Software without restriction, including without limitation
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
- * and/or sell copies of the Software, and to permit persons to whom the
- * Software is furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice (including the next
- * paragraph) shall be included in all copies or substantial portions of the
- * Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
- * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- *
- * Authors:
- *    Rob Clark <robclark@freedesktop.org>
- */
-
-#include "pipe/p_state.h"
-#include "util/u_memory.h"
-#include "util/u_inlines.h"
-
-#include "freedreno_query_hw.h"
-#include "freedreno_context.h"
-#include "freedreno_util.h"
-
-struct fd_hw_sample_period {
-	struct fd_hw_sample *start, *end;
-	struct list_head list;
-};
-
-/* maps query_type to sample provider idx: */
-static int pidx(unsigned query_type)
-{
-	switch (query_type) {
-	case PIPE_QUERY_OCCLUSION_COUNTER:
-		return 0;
-	case PIPE_QUERY_OCCLUSION_PREDICATE:
-		return 1;
-	default:
-		return -1;
-	}
-}
-
-static struct fd_hw_sample *
-get_sample(struct fd_context *ctx, struct fd_ringbuffer *ring,
-		unsigned query_type)
-{
-	struct fd_hw_sample *samp = NULL;
-	int idx = pidx(query_type);
-
-	if (!ctx->sample_cache[idx]) {
-		ctx->sample_cache[idx] =
-			ctx->sample_providers[idx]->get_sample(ctx, ring);
-	}
-
-	fd_hw_sample_reference(ctx, &samp, ctx->sample_cache[idx]);
-
-	return samp;
-}
-
-static void
-clear_sample_cache(struct fd_context *ctx)
-{
-	int i;
-
-	for (i = 0; i < ARRAY_SIZE(ctx->sample_cache); i++)
-		fd_hw_sample_reference(ctx, &ctx->sample_cache[i], NULL);
-}
-
-static bool
-is_active(struct fd_hw_query *hq, enum fd_render_stage stage)
-{
-	return !!(hq->provider->active & stage);
-}
-
-
-static void
-resume_query(struct fd_context *ctx, struct fd_hw_query *hq,
-		struct fd_ringbuffer *ring)
-{
-	assert(!hq->period);
-	hq->period = util_slab_alloc(&ctx->sample_period_pool);
-	list_inithead(&hq->period->list);
-	hq->period->start = get_sample(ctx, ring, hq->base.type);
-	/* NOTE: util_slab_alloc() does not zero out the buffer: */
-	hq->period->end = NULL;
-}
-
-static void
-pause_query(struct fd_context *ctx, struct fd_hw_query *hq,
-		struct fd_ringbuffer *ring)
-{
-	assert(hq->period && !hq->period->end);
-	hq->period->end = get_sample(ctx, ring, hq->base.type);
-	list_addtail(&hq->period->list, &hq->current_periods);
-	hq->period = NULL;
-}
-
-static void
-destroy_periods(struct fd_context *ctx, struct list_head *list)
-{
-	struct fd_hw_sample_period *period, *s;
-	LIST_FOR_EACH_ENTRY_SAFE(period, s, list, list) {
-		fd_hw_sample_reference(ctx, &period->start, NULL);
-		fd_hw_sample_reference(ctx, &period->end, NULL);
-		list_del(&period->list);
-		util_slab_free(&ctx->sample_period_pool, period);
-	}
-}
-
-static void
-fd_hw_destroy_query(struct fd_context *ctx, struct fd_query *q)
-{
-	struct fd_hw_query *hq = fd_hw_query(q);
-
-	destroy_periods(ctx, &hq->periods);
-	destroy_periods(ctx, &hq->current_periods);
-	list_del(&hq->list);
-
-	free(hq);
-}
-
-static void
-fd_hw_begin_query(struct fd_context *ctx, struct fd_query *q)
-{
-	struct fd_hw_query *hq = fd_hw_query(q);
-	if (q->active)
-		return;
-
-	/* begin_query() should clear previous results: */
-	destroy_periods(ctx, &hq->periods);
-
-	if (is_active(hq, ctx->stage))
-		resume_query(ctx, hq, ctx->ring);
-
-	q->active = true;
-
-	/* add to active list: */
-	list_del(&hq->list);
-	list_addtail(&hq->list, &ctx->active_queries);
-}
-
-static void
-fd_hw_end_query(struct fd_context *ctx, struct fd_query *q)
-{
-	struct fd_hw_query *hq = fd_hw_query(q);
-	if (!q->active)
-		return;
-	if (is_active(hq, ctx->stage))
-		pause_query(ctx, hq, ctx->ring);
-	q->active = false;
-	/* move to current list: */
-	list_del(&hq->list);
-	list_addtail(&hq->list, &ctx->current_queries);
-}
-
-/* helper to get ptr to specified sample: */
-static void * sampptr(struct fd_hw_sample *samp, uint32_t n, void *ptr)
-{
-	return ((char *)ptr) + (samp->tile_stride * n) + samp->offset;
-}
-
-static boolean
-fd_hw_get_query_result(struct fd_context *ctx, struct fd_query *q,
-		boolean wait, union pipe_query_result *result)
-{
-	struct fd_hw_query *hq = fd_hw_query(q);
-	const struct fd_hw_sample_provider *p = hq->provider;
-	struct fd_hw_sample_period *period;
-
-	if (q->active)
-		return false;
-
-	/* if the app tries to read back the query result before the
-	 * back is submitted, that forces us to flush so that there
-	 * are actually results to wait for:
-	 */
-	if (!LIST_IS_EMPTY(&hq->list)) {
-		DBG("reading query result forces flush!");
-		ctx->needs_flush = true;
-		fd_context_render(&ctx->base);
-	}
-
-	util_query_clear_result(result, q->type);
-
-	if (LIST_IS_EMPTY(&hq->periods))
-		return true;
-
-	assert(LIST_IS_EMPTY(&hq->list));
-	assert(LIST_IS_EMPTY(&hq->current_periods));
-	assert(!hq->period);
-
-	if (LIST_IS_EMPTY(&hq->periods))
-		return true;
-
-	/* if !wait, then check the last sample (the one most likely to
-	 * not be ready yet) and bail if it is not ready:
-	 */
-	if (!wait) {
-		int ret;
-
-		period = LIST_ENTRY(struct fd_hw_sample_period,
-				hq->periods.prev, list);
-
-		ret = fd_bo_cpu_prep(period->end->bo, ctx->screen->pipe,
-				DRM_FREEDRENO_PREP_READ | DRM_FREEDRENO_PREP_NOSYNC);
-		if (ret)
-			return false;
-
-		fd_bo_cpu_fini(period->end->bo);
-	}
-
-	/* sum the result across all sample periods: */
-	LIST_FOR_EACH_ENTRY(period, &hq->periods, list) {
-		struct fd_hw_sample *start = period->start;
-		struct fd_hw_sample *end = period->end;
-		unsigned i;
-
-		/* start and end samples should be from same batch: */
-		assert(start->bo == end->bo);
-		assert(start->num_tiles == end->num_tiles);
-
-		for (i = 0; i < start->num_tiles; i++) {
-			void *ptr;
-
-			fd_bo_cpu_prep(start->bo, ctx->screen->pipe,
-					DRM_FREEDRENO_PREP_READ);
-
-			ptr = fd_bo_map(start->bo);
-
-			p->accumulate_result(ctx, sampptr(period->start, i, ptr),
-					sampptr(period->end, i, ptr), result);
-
-			fd_bo_cpu_fini(start->bo);
-		}
-	}
-
-	return true;
-}
-
-static const struct fd_query_funcs hw_query_funcs = {
-		.destroy_query    = fd_hw_destroy_query,
-		.begin_query      = fd_hw_begin_query,
-		.end_query        = fd_hw_end_query,
-		.get_query_result = fd_hw_get_query_result,
-};
-
-struct fd_query *
-fd_hw_create_query(struct fd_context *ctx, unsigned query_type)
-{
-	struct fd_hw_query *hq;
-	struct fd_query *q;
-	int idx = pidx(query_type);
-
-	if ((idx < 0) || !ctx->sample_providers[idx])
-		return NULL;
-
-	hq = CALLOC_STRUCT(fd_hw_query);
-	if (!hq)
-		return NULL;
-
-	hq->provider = ctx->sample_providers[idx];
-
-	list_inithead(&hq->periods);
-	list_inithead(&hq->current_periods);
-	list_inithead(&hq->list);
-
-	q = &hq->base;
-	q->funcs = &hw_query_funcs;
-	q->type = query_type;
-
-	return q;
-}
-
-struct fd_hw_sample *
-fd_hw_sample_init(struct fd_context *ctx, uint32_t size)
-{
-	struct fd_hw_sample *samp = util_slab_alloc(&ctx->sample_pool);
-	pipe_reference_init(&samp->reference, 1);
-	samp->size = size;
-	samp->offset = ctx->next_sample_offset;
-	/* NOTE: util_slab_alloc() does not zero out the buffer: */
-	samp->bo = NULL;
-	samp->num_tiles = 0;
-	samp->tile_stride = 0;
-	ctx->next_sample_offset += size;
-	return samp;
-}
-
-void
-__fd_hw_sample_destroy(struct fd_context *ctx, struct fd_hw_sample *samp)
-{
-	if (samp->bo)
-		fd_bo_del(samp->bo);
-	util_slab_free(&ctx->sample_pool, samp);
-}
-
-static void
-prepare_sample(struct fd_hw_sample *samp, struct fd_bo *bo,
-		uint32_t num_tiles, uint32_t tile_stride)
-{
-	if (samp->bo) {
-		assert(samp->bo == bo);
-		assert(samp->num_tiles == num_tiles);
-		assert(samp->tile_stride == tile_stride);
-		return;
-	}
-	samp->bo = bo;
-	samp->num_tiles = num_tiles;
-	samp->tile_stride = tile_stride;
-}
-
-static void
-prepare_query(struct fd_hw_query *hq, struct fd_bo *bo,
-		uint32_t num_tiles, uint32_t tile_stride)
-{
-	struct fd_hw_sample_period *period, *s;
-
-	/* prepare all the samples in the query: */
-	LIST_FOR_EACH_ENTRY_SAFE(period, s, &hq->current_periods, list) {
-		prepare_sample(period->start, bo, num_tiles, tile_stride);
-		prepare_sample(period->end, bo, num_tiles, tile_stride);
-
-		/* move from current_periods list to periods list: */
-		list_del(&period->list);
-		list_addtail(&period->list, &hq->periods);
-	}
-}
-
-static void
-prepare_queries(struct fd_context *ctx, struct fd_bo *bo,
-		uint32_t num_tiles, uint32_t tile_stride,
-		struct list_head *list, bool remove)
-{
-	struct fd_hw_query *hq, *s;
-	LIST_FOR_EACH_ENTRY_SAFE(hq, s, list, list) {
-		prepare_query(hq, bo, num_tiles, tile_stride);
-		if (remove)
-			list_delinit(&hq->list);
-	}
-}
-
-/* called from gmem code once total storage requirements are known (ie.
- * number of samples times number of tiles)
- */
-void
-fd_hw_query_prepare(struct fd_context *ctx, uint32_t num_tiles)
-{
-	uint32_t tile_stride = ctx->next_sample_offset;
-	struct fd_bo *bo;
-
-	if (ctx->query_bo)
-		fd_bo_del(ctx->query_bo);
-
-	if (tile_stride > 0) {
-		bo = fd_bo_new(ctx->dev, tile_stride * num_tiles,
-				DRM_FREEDRENO_GEM_CACHE_WCOMBINE |
-				DRM_FREEDRENO_GEM_TYPE_KMEM);
-	} else {
-		bo = NULL;
-	}
-
-	ctx->query_bo = bo;
-	ctx->query_tile_stride = tile_stride;
-
-	prepare_queries(ctx, bo, num_tiles, tile_stride,
-			&ctx->active_queries, false);
-	prepare_queries(ctx, bo, num_tiles, tile_stride,
-			&ctx->current_queries, true);
-
-	/* reset things for next batch: */
-	ctx->next_sample_offset = 0;
-}
-
-void
-fd_hw_query_prepare_tile(struct fd_context *ctx, uint32_t n,
-		struct fd_ringbuffer *ring)
-{
-	uint32_t tile_stride = ctx->query_tile_stride;
-	uint32_t offset = tile_stride * n;
-
-	/* bail if no queries: */
-	if (tile_stride == 0)
-		return;
-
-	fd_wfi(ctx, ring);
-	OUT_PKT0 (ring, HW_QUERY_BASE_REG, 1);
-	OUT_RELOCW(ring, ctx->query_bo, offset, 0, 0);
-}
-
-void
-fd_hw_query_set_stage(struct fd_context *ctx, struct fd_ringbuffer *ring,
-		enum fd_render_stage stage)
-{
-	/* special case: internal blits (like mipmap level generation)
-	 * go through normal draw path (via util_blitter_blit()).. but
-	 * we need to ignore the FD_STAGE_DRAW which will be set, so we
-	 * don't enable queries which should be paused during internal
-	 * blits:
-	 */
-	if ((ctx->stage == FD_STAGE_BLIT) &&
-			(stage != FD_STAGE_NULL))
-		return;
-
-	if (stage != ctx->stage) {
-		struct fd_hw_query *hq;
-		LIST_FOR_EACH_ENTRY(hq, &ctx->active_queries, list) {
-			bool was_active = is_active(hq, ctx->stage);
-			bool now_active = is_active(hq, stage);
-
-			if (now_active && !was_active)
-				resume_query(ctx, hq, ring);
-			else if (was_active && !now_active)
-				pause_query(ctx, hq, ring);
-		}
-	}
-	clear_sample_cache(ctx);
-	ctx->stage = stage;
-}
-
-void
-fd_hw_query_register_provider(struct pipe_context *pctx,
-		const struct fd_hw_sample_provider *provider)
-{
-	struct fd_context *ctx = fd_context(pctx);
-	int idx = pidx(provider->query_type);
-
-	assert((0 <= idx) && (idx < MAX_HW_SAMPLE_PROVIDERS));
-	assert(!ctx->sample_providers[idx]);
-
-	ctx->sample_providers[idx] = provider;
-}
-
-void
-fd_hw_query_init(struct pipe_context *pctx)
-{
-	struct fd_context *ctx = fd_context(pctx);
-
-	util_slab_create(&ctx->sample_pool, sizeof(struct fd_hw_sample),
-			16, UTIL_SLAB_SINGLETHREADED);
-	util_slab_create(&ctx->sample_period_pool, sizeof(struct fd_hw_sample_period),
-			16, UTIL_SLAB_SINGLETHREADED);
-	list_inithead(&ctx->active_queries);
-	list_inithead(&ctx->current_queries);
-}
-
-void
-fd_hw_query_fini(struct pipe_context *pctx)
-{
-	struct fd_context *ctx = fd_context(pctx);
-
-	util_slab_destroy(&ctx->sample_pool);
-	util_slab_destroy(&ctx->sample_period_pool);
-}
--- a/src/gallium/drivers/freedreno/freedreno_query_hw.h
+++ b/src/gallium/drivers/freedreno/freedreno_query_hw.h
@@ -1,164 +0,0 @@
-/* -*- mode: C; c-file-style: "k&r"; tab-width 4; indent-tabs-mode: t; -*- */
-
-/*
- * Copyright (C) 2014 Rob Clark <robclark@freedesktop.org>
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the "Software"),
- * to deal in the Software without restriction, including without limitation
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
- * and/or sell copies of the Software, and to permit persons to whom the
- * Software is furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice (including the next
- * paragraph) shall be included in all copies or substantial portions of the
- * Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
- * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- *
- * Authors:
- *    Rob Clark <robclark@freedesktop.org>
- */
-
-#ifndef FREEDRENO_QUERY_HW_H_
-#define FREEDRENO_QUERY_HW_H_
-
-#include "util/u_double_list.h"
-
-#include "freedreno_query.h"
-#include "freedreno_context.h"
-
-
-/*
- * HW Queries:
- *
- * See: https://github.com/freedreno/freedreno/wiki/Queries#hardware-queries
- *
- * Hardware queries will be specific to gpu generation, but they need
- * some common infrastructure for triggering start/stop samples at
- * various points (for example, to exclude mem2gmem/gmem2mem or clear)
- * as well as per tile tracking.
- *
- * NOTE: in at least some cases hw writes sample values to memory addr
- * specified in some register.  So we don't really have the option to
- * just sample the same counter multiple times for multiple different
- * queries with the same query_type.  So we cache per sample provider
- * the most recent sample since the last draw.  This way multiple
- * sample periods for multiple queries can reference the same sample.
- *
- * fd_hw_sample_provider:
- *   - one per query type, registered/implemented by gpu generation
- *     specific code
- *   - can construct fd_hw_samples on demand
- *   - most recent sample (since last draw) cached so multiple
- *     different queries can ref the same sample
- *
- * fd_hw_sample:
- *   - abstracts one snapshot of counter value(s) across N tiles
- *   - backing object not allocated until submit time when number
- *     of samples and number of tiles is known
- *
- * fd_hw_sample_period:
- *   - consists of start and stop sample
- *   - a query accumulates a list of sample periods
- *   - the query result is the sum of the sample periods
- */
-
-struct fd_hw_sample_provider {
-	unsigned query_type;
-
-	/* stages applicable to the query type: */
-	enum fd_render_stage active;
-
-	/* when a new sample is required, emit appropriate cmdstream
-	 * and return a sample object:
-	 */
-	struct fd_hw_sample *(*get_sample)(struct fd_context *ctx,
-			struct fd_ringbuffer *ring);
-
-	/* accumulate the results from specified sample period: */
-	void (*accumulate_result)(struct fd_context *ctx,
-			const void *start, const void *end,
-			union pipe_query_result *result);
-};
-
-struct fd_hw_sample {
-	struct pipe_reference reference;  /* keep this first */
-
-	/* offset and size of the sample are know at the time the
-	 * sample is constructed.
-	 */
-	uint32_t size;
-	uint32_t offset;
-
-	/* backing object, offset/stride/etc are determined not when
-	 * the sample is constructed, but when the batch is submitted.
-	 * This way we can defer allocation until total # of requested
-	 * samples, and total # of tiles, is known.
-	 */
-	struct fd_bo *bo;
-	uint32_t num_tiles;
-	uint32_t tile_stride;
-};
-
-struct fd_hw_sample_period;
-
-struct fd_hw_query {
-	struct fd_query base;
-
-	const struct fd_hw_sample_provider *provider;
-
-	/* list of fd_hw_sample_period in previous submits: */
-	struct list_head periods;
-
-	/* list of fd_hw_sample_period's in current submit: */
-	struct list_head current_periods;
-
-	/* if active and not paused, the current sample period (not
-	 * yet added to current_periods):
-	 */
-	struct fd_hw_sample_period *period;
-
-	struct list_head list;  /* list-node in ctx->active_queries */
-};
-
-static inline struct fd_hw_query *
-fd_hw_query(struct fd_query *q)
-{
-	return (struct fd_hw_query *)q;
-}
-
-struct fd_query * fd_hw_create_query(struct fd_context *ctx, unsigned query_type);
-/* helper for sample providers: */
-struct fd_hw_sample * fd_hw_sample_init(struct fd_context *ctx, uint32_t size);
-/* don't call directly, use fd_hw_sample_reference() */
-void __fd_hw_sample_destroy(struct fd_context *ctx, struct fd_hw_sample *samp);
-void fd_hw_query_prepare(struct fd_context *ctx, uint32_t num_tiles);
-void fd_hw_query_prepare_tile(struct fd_context *ctx, uint32_t n,
-		struct fd_ringbuffer *ring);
-void fd_hw_query_set_stage(struct fd_context *ctx,
-		struct fd_ringbuffer *ring, enum fd_render_stage stage);
-void fd_hw_query_register_provider(struct pipe_context *pctx,
-		const struct fd_hw_sample_provider *provider);
-void fd_hw_query_init(struct pipe_context *pctx);
-void fd_hw_query_fini(struct pipe_context *pctx);
-
-static inline void
-fd_hw_sample_reference(struct fd_context *ctx,
-		struct fd_hw_sample **ptr, struct fd_hw_sample *samp)
-{
-	struct fd_hw_sample *old_samp = *ptr;
-
-	if (pipe_reference(&(*ptr)->reference, &samp->reference))
-		__fd_hw_sample_destroy(ctx, old_samp);
-	if (ptr)
-		*ptr = samp;
-}
-
-#endif /* FREEDRENO_QUERY_HW_H_ */
--- a/src/gallium/drivers/freedreno/freedreno_query_sw.c
+++ b/src/gallium/drivers/freedreno/freedreno_query_sw.c
@@ -1,165 +0,0 @@
-/* -*- mode: C; c-file-style: "k&r"; tab-width 4; indent-tabs-mode: t; -*- */
-
-/*
- * Copyright (C) 2014 Rob Clark <robclark@freedesktop.org>
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the "Software"),
- * to deal in the Software without restriction, including without limitation
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
- * and/or sell copies of the Software, and to permit persons to whom the
- * Software is furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice (including the next
- * paragraph) shall be included in all copies or substantial portions of the
- * Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
- * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- *
- * Authors:
- *    Rob Clark <robclark@freedesktop.org>
- */
-
-#include "pipe/p_state.h"
-#include "util/u_string.h"
-#include "util/u_memory.h"
-#include "util/u_inlines.h"
-#include "os/os_time.h"
-
-#include "freedreno_query_sw.h"
-#include "freedreno_context.h"
-#include "freedreno_util.h"
-
-/*
- * SW Queries:
- *
- * In the core, we have some support for basic sw counters
- */
-
-static void
-fd_sw_destroy_query(struct fd_context *ctx, struct fd_query *q)
-{
-	struct fd_sw_query *sq = fd_sw_query(q);
-	free(sq);
-}
-
-static uint64_t
-read_counter(struct fd_context *ctx, int type)
-{
-	switch (type) {
-	case PIPE_QUERY_PRIMITIVES_GENERATED:
-		/* for now same thing as _PRIMITIVES_EMITTED */
-	case PIPE_QUERY_PRIMITIVES_EMITTED:
-		return ctx->stats.prims_emitted;
-	case FD_QUERY_DRAW_CALLS:
-		return ctx->stats.draw_calls;
-	case FD_QUERY_BATCH_TOTAL:
-		return ctx->stats.batch_total;
-	case FD_QUERY_BATCH_SYSMEM:
-		return ctx->stats.batch_sysmem;
-	case FD_QUERY_BATCH_GMEM:
-		return ctx->stats.batch_gmem;
-	case FD_QUERY_BATCH_RESTORE:
-		return ctx->stats.batch_restore;
-	}
-	return 0;
-}
-
-static bool
-is_rate_query(struct fd_query *q)
-{
-	switch (q->type) {
-	case FD_QUERY_BATCH_TOTAL:
-	case FD_QUERY_BATCH_SYSMEM:
-	case FD_QUERY_BATCH_GMEM:
-	case FD_QUERY_BATCH_RESTORE:
-		return true;
-	default:
-		return false;
-	}
-}
-
-static void
-fd_sw_begin_query(struct fd_context *ctx, struct fd_query *q)
-{
-	struct fd_sw_query *sq = fd_sw_query(q);
-	q->active = true;
-	sq->begin_value = read_counter(ctx, q->type);
-	if (is_rate_query(q))
-		sq->begin_time = os_time_get();
-}
-
-static void
-fd_sw_end_query(struct fd_context *ctx, struct fd_query *q)
-{
-	struct fd_sw_query *sq = fd_sw_query(q);
-	q->active = false;
-	sq->end_value = read_counter(ctx, q->type);
-	if (is_rate_query(q))
-		sq->end_time = os_time_get();
-}
-
-static boolean
-fd_sw_get_query_result(struct fd_context *ctx, struct fd_query *q,
-		boolean wait, union pipe_query_result *result)
-{
-	struct fd_sw_query *sq = fd_sw_query(q);
-
-	if (q->active)
-		return false;
-
-	util_query_clear_result(result, q->type);
-
-	result->u64 = sq->end_value - sq->begin_value;
-
-	if (is_rate_query(q)) {
-		double fps = (result->u64 * 1000000) /
-				(double)(sq->end_time - sq->begin_time);
-		result->u64 = (uint64_t)fps;
-	}
-
-	return true;
-}
-
-static const struct fd_query_funcs sw_query_funcs = {
-		.destroy_query    = fd_sw_destroy_query,
-		.begin_query      = fd_sw_begin_query,
-		.end_query        = fd_sw_end_query,
-		.get_query_result = fd_sw_get_query_result,
-};
-
-struct fd_query *
-fd_sw_create_query(struct fd_context *ctx, unsigned query_type)
-{
-	struct fd_sw_query *sq;
-	struct fd_query *q;
-
-	switch (query_type) {
-	case PIPE_QUERY_PRIMITIVES_GENERATED:
-	case PIPE_QUERY_PRIMITIVES_EMITTED:
-	case FD_QUERY_DRAW_CALLS:
-	case FD_QUERY_BATCH_TOTAL:
-	case FD_QUERY_BATCH_SYSMEM:
-	case FD_QUERY_BATCH_GMEM:
-	case FD_QUERY_BATCH_RESTORE:
-		break;
-	default:
-		return NULL;
-	}
-
-	sq = CALLOC_STRUCT(fd_sw_query);
-	if (!sq)
-		return NULL;
-
-	q = &sq->base;
-	q->funcs = &sw_query_funcs;
-	q->type = query_type;
-
-	return q;
-}
--- a/src/gallium/drivers/freedreno/freedreno_query_sw.h
+++ b/src/gallium/drivers/freedreno/freedreno_query_sw.h
@@ -1,55 +0,0 @@
-/* -*- mode: C; c-file-style: "k&r"; tab-width 4; indent-tabs-mode: t; -*- */
-
-/*
- * Copyright (C) 2014 Rob Clark <robclark@freedesktop.org>
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the "Software"),
- * to deal in the Software without restriction, including without limitation
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
- * and/or sell copies of the Software, and to permit persons to whom the
- * Software is furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice (including the next
- * paragraph) shall be included in all copies or substantial portions of the
- * Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
- * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- *
- * Authors:
- *    Rob Clark <robclark@freedesktop.org>
- */
-
-#ifndef FREEDRENO_QUERY_SW_H_
-#define FREEDRENO_QUERY_SW_H_
-
-#include "freedreno_query.h"
-
-/*
- * SW Queries:
- *
- * In the core, we have some support for basic sw counters
- */
-
-struct fd_sw_query {
-	struct fd_query base;
-	uint64_t begin_value, end_value;
-	uint64_t begin_time, end_time;
-};
-
-static inline struct fd_sw_query *
-fd_sw_query(struct fd_query *q)
-{
-	return (struct fd_sw_query *)q;
-}
-
-struct fd_query * fd_sw_create_query(struct fd_context *ctx,
-		unsigned query_type);
-
-#endif /* FREEDRENO_QUERY_SW_H_ */
--- a/src/gallium/drivers/freedreno/freedreno_resource.c
+++ b/src/gallium/drivers/freedreno/freedreno_resource.c
@@ -36,7 +36,6 @@
 #include "freedreno_screen.h"
 #include "freedreno_surface.h"
 #include "freedreno_context.h"
-#include "freedreno_query_hw.h"
 #include "freedreno_util.h"

 #include <errno.h>
@@ -48,10 +47,6 @@ realloc_bo(struct fd_resource *rsc, uint32_t size)
 	uint32_t flags = DRM_FREEDRENO_GEM_CACHE_WCOMBINE |
 			DRM_FREEDRENO_GEM_TYPE_KMEM; /* TODO */

-	/* if we start using things other than write-combine,
-	 * be sure to check for PIPE_RESOURCE_FLAG_MAP_COHERENT
-	 */
-
 	if (rsc->bo)
 		fd_bo_del(rsc->bo);

@@ -406,9 +401,7 @@ render_blit(struct pipe_context *pctx, struct pipe_blit_info *info)
 	util_blitter_save_fragment_sampler_views(ctx->blitter,
 			ctx->fragtex.num_textures, ctx->fragtex.textures);

-	fd_hw_query_set_stage(ctx, ctx->ring, FD_STAGE_BLIT);
 	util_blitter_blit(ctx->blitter, info);
-	fd_hw_query_set_stage(ctx, ctx->ring, FD_STAGE_NULL);

 	return true;
 }
--- a/src/gallium/drivers/freedreno/freedreno_screen.c
+++ b/src/gallium/drivers/freedreno/freedreno_screen.c
@@ -50,8 +50,8 @@
 #include "freedreno_query.h"
 #include "freedreno_util.h"

-#include "a2xx/fd2_screen.h"
-#include "a3xx/fd3_screen.h"
+#include "fd2_screen.h"
+#include "fd3_screen.h"

 /* XXX this should go away */
 #include "state_tracker/drm_driver.h"
@@ -143,8 +143,6 @@ tables for things that differ if the delta is not too much..
 static int
 fd_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
 {
-	struct fd_screen *screen = fd_screen(pscreen);
-
 	/* this is probably not totally correct.. but it's a start: */
 	switch (param) {
 	/* Supported features (boolean caps). */
@@ -161,7 +159,11 @@ fd_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
 	case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
 	case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
 	case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
+	case PIPE_CAP_SM3:
 	case PIPE_CAP_SEAMLESS_CUBE_MAP:
+	case PIPE_CAP_PRIMITIVE_RESTART:
+	case PIPE_CAP_CONDITIONAL_RENDER:
+	case PIPE_CAP_TEXTURE_BARRIER:
 	case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
 	case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
 	case PIPE_CAP_TGSI_INSTANCEID:
@@ -171,18 +173,13 @@ fd_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
 	case PIPE_CAP_COMPUTE:
 	case PIPE_CAP_START_INSTANCE:
 	case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
+	case PIPE_CAP_TEXTURE_MULTISAMPLE:
 	case PIPE_CAP_USER_CONSTANT_BUFFERS:
-	case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
 		return 1;

 	case PIPE_CAP_SHADER_STENCIL_EXPORT:
 	case PIPE_CAP_TGSI_TEXCOORD:
 	case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
-	case PIPE_CAP_CONDITIONAL_RENDER:
-	case PIPE_CAP_PRIMITIVE_RESTART:
-	case PIPE_CAP_TEXTURE_MULTISAMPLE:
-	case PIPE_CAP_TEXTURE_BARRIER:
-	case PIPE_CAP_SM3:
 		return 0;

 	case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
@@ -208,6 +205,7 @@ fd_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
        case PIPE_CAP_TGSI_VS_LAYER:
 	case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
 	case PIPE_CAP_TEXTURE_GATHER_SM5:
+        case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
        case PIPE_CAP_FAKE_SW_MSAA:
 	case PIPE_CAP_TEXTURE_QUERY_LOD:
        case PIPE_CAP_SAMPLE_SHADING:
@@ -231,18 +229,17 @@ fd_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
 	case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
 		return MAX_MIP_LEVELS;
 	case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
-		return 0;  /* TODO: a3xx+ should support (required in gles3) */
+		return 9192;

 	/* Render targets. */
 	case PIPE_CAP_MAX_RENDER_TARGETS:
 		return 1;

-	/* Queries. */
+	/* Timer queries. */
 	case PIPE_CAP_QUERY_TIME_ELAPSED:
+	case PIPE_CAP_OCCLUSION_QUERY:
 	case PIPE_CAP_QUERY_TIMESTAMP:
 		return 0;
-	case PIPE_CAP_OCCLUSION_QUERY:
-		return (screen->gpu_id >= 300) ? 1: 0;

 	case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
 	case PIPE_CAP_MIN_TEXEL_OFFSET:
@@ -255,7 +252,7 @@ fd_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
 	case PIPE_CAP_ENDIANNESS:
 		return PIPE_ENDIAN_LITTLE;

-	case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
+        case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
 		return 64;

 	default:
@@ -318,7 +315,7 @@ fd_screen_get_shader_param(struct pipe_screen *pscreen, unsigned shader,
 	case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
 		return 8; /* XXX */
 	case PIPE_SHADER_CAP_MAX_INPUTS:
-		return 16;
+		return 32;
 	case PIPE_SHADER_CAP_MAX_TEMPS:
 		return 64; /* Max native temporaries. */
 	case PIPE_SHADER_CAP_MAX_ADDRS:
--- a/src/gallium/drivers/freedreno/freedreno_texture.c
+++ b/src/gallium/drivers/freedreno/freedreno_texture.c
@@ -57,7 +57,7 @@ static void bind_sampler_states(struct fd_texture_stateobj *prog,

 	for (i = 0; i < nr; i++) {
 		if (hwcso[i])
-			new_nr = i + 1;
+			new_nr++;
 		prog->samplers[i] = hwcso[i];
 		prog->dirty_samplers |= (1 << i);
 	}
@@ -78,7 +78,7 @@ static void set_sampler_views(struct fd_texture_stateobj *prog,

 	for (i = 0; i < nr; i++) {
 		if (views[i])
-			new_nr = i + 1;
+			new_nr++;
 		pipe_sampler_view_reference(&prog->textures[i], views[i]);
 		prog->dirty_samplers |= (1 << i);
 	}
--- a/src/gallium/drivers/freedreno/freedreno_util.c
+++ b/src/gallium/drivers/freedreno/freedreno_util.c
@@ -111,6 +111,26 @@ fd_blend_factor(unsigned factor)
 	}
 }

+enum adreno_rb_blend_opcode
+fd_blend_func(unsigned func)
+{
+	switch (func) {
+	case PIPE_BLEND_ADD:
+		return BLEND_DST_PLUS_SRC;
+	case PIPE_BLEND_MIN:
+		return BLEND_MIN_DST_SRC;
+	case PIPE_BLEND_MAX:
+		return BLEND_MAX_DST_SRC;
+	case PIPE_BLEND_SUBTRACT:
+		return BLEND_SRC_MINUS_DST;
+	case PIPE_BLEND_REVERSE_SUBTRACT:
+		return BLEND_DST_MINUS_SRC;
+	default:
+		DBG("invalid blend func: %x", func);
+		return 0;
+	}
+}
+
 enum adreno_pa_su_sc_draw
 fd_polygon_mode(unsigned mode)
 {
--- a/src/gallium/drivers/freedreno/freedreno_util.h
+++ b/src/gallium/drivers/freedreno/freedreno_util.h
@@ -45,6 +45,7 @@
 enum adreno_rb_depth_format fd_pipe2depth(enum pipe_format format);
 enum pc_di_index_size fd_pipe2index(enum pipe_format format);
 enum adreno_rb_blend_factor fd_blend_factor(unsigned factor);
+enum adreno_rb_blend_opcode fd_blend_func(unsigned func);
 enum adreno_pa_su_sc_draw fd_polygon_mode(unsigned mode);
 enum adreno_stencil_op fd_stencil_op(unsigned op);

@@ -222,18 +223,11 @@ OUT_IB(struct fd_ringbuffer *ring, struct fd_ringmarker *start,
 	emit_marker(ring, 6);
 }

-/* CP_SCRATCH_REG4 is used to hold base address for query results: */
-#define HW_QUERY_BASE_REG REG_AXXX_CP_SCRATCH_REG4
-
 static inline void
 emit_marker(struct fd_ringbuffer *ring, int scratch_idx)
 {
 	extern unsigned marker_cnt;
-	unsigned reg = REG_AXXX_CP_SCRATCH_REG0 + scratch_idx;
-	assert(reg != HW_QUERY_BASE_REG);
-	if (reg == HW_QUERY_BASE_REG)
-		return;
-	OUT_PKT0(ring, reg, 1);
+	OUT_PKT0(ring, REG_AXXX_CP_SCRATCH_REG0 + scratch_idx, 1);
 	OUT_RING(ring, ++marker_cnt);
 }

--- a/src/gallium/drivers/llvmpipe/lp_rast.c
+++ b/src/gallium/drivers/llvmpipe/lp_rast.c
@@ -312,15 +312,9 @@ lp_rast_shade_tile(struct lp_rasterizer_task *task,

         /* color buffer */
         for (i = 0; i < scene->fb.nr_cbufs; i++){
-            if (scene->fb.cbufs[i]) {
-               stride[i] = scene->cbufs[i].stride;
-               color[i] = lp_rast_get_unswizzled_color_block_pointer(task, i, tile_x + x,
-                                                                     tile_y + y, inputs->layer);
-            }
-            else {
-               stride[i] = 0;
-               color[i] = NULL;
-            }
+            stride[i] = scene->cbufs[i].stride;
+            color[i] = lp_rast_get_unswizzled_color_block_pointer(task, i, tile_x + x,
+                                                                  tile_y + y, inputs->layer);
         }

         /* depth buffer */
--- a/src/gallium/drivers/llvmpipe/lp_texture.c
+++ b/src/gallium/drivers/llvmpipe/lp_texture.c
@@ -115,7 +115,7 @@ llvmpipe_texture_layout(struct llvmpipe_screen *screen,
            lpr->row_stride[level] = align(nblocksx * block_size, util_cpu_caps.cacheline);

         /* if row_stride * height > LP_MAX_TEXTURE_SIZE */
-         if ((uint64_t)lpr->row_stride[level] * nblocksy > LP_MAX_TEXTURE_SIZE) {
+         if (lpr->row_stride[level] > LP_MAX_TEXTURE_SIZE / nblocksy) {
            /* image too large */
            goto fail;
         }
--- a/src/gallium/drivers/nouveau/Android.mk
+++ b/src/gallium/drivers/nouveau/Android.mk
@@ -28,19 +28,18 @@ include $(LOCAL_PATH)/Makefile.sources

 include $(CLEAR_VARS)

-LOCAL_SRC_FILES := \
-	$(C_SOURCES) \
+LOCAL_SRC_FILES := $(C_SOURCES) \
 	$(NV30_C_SOURCES) \
 	$(NV50_CODEGEN_SOURCES) \
 	$(NV50_C_SOURES) \
 	$(NVC0_CODEGEN_SOURCES) \
 	$(NVC0_C_SOURCES)

-LOCAL_C_INCLUDES := \
-	$(TARGET_OUT_HEADERS)/libdrm
+LOCAL_C_INCLUDES := $(DRM_TOP) \
+	$(DRM_TOP)/include/drm \
+	$(DRM_TOP)/nouveau

 LOCAL_MODULE := libmesa_pipe_nouveau

-include external/stlport/libstlport.mk
 include $(GALLIUM_COMMON_MK)
 include $(BUILD_STATIC_LIBRARY)
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_driver.h
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_driver.h
@@ -177,7 +177,6 @@ struct nv50_ir_prog_info
      uint8_t vertexId;          /* system value index of VertexID */
      uint8_t edgeFlagIn;
      uint8_t edgeFlagOut;
-      int8_t viewportId;         /* output index of ViewportIndex */
      uint8_t fragDepth;         /* output index of FragDepth */
      uint8_t sampleMask;        /* output index of SampleMask */
      boolean sampleInterp;      /* perform sample interp on all fp inputs */
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_emit_gk110.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_emit_gk110.cpp
@@ -287,12 +287,10 @@ CodeEmitterGK110::emitPredicate(const Instruction *i)
 void
 CodeEmitterGK110::setCAddress14(const ValueRef& src)
 {
-   const Storage& res = src.get()->asSym()->reg;
-   const int32_t addr = res.data.offset / 4;
+   const int32_t addr = src.get()->asSym()->reg.data.offset / 4;

   code[0] |= (addr & 0x01ff) << 23;
   code[1] |= (addr & 0x3e00) >> 9;
-   code[1] |= res.fileIndex << 5;
 }

 void
@@ -415,6 +413,7 @@ CodeEmitterGK110::emitForm_21(const Instruction *i, uint32_t opc2,
      case FILE_MEMORY_CONST:
         code[1] &= (s == 2) ? ~(0x4 << 28) : ~(0x8 << 28);
         setCAddress14(i->src(s));
+         code[1] |= i->getSrc(s)->reg.fileIndex << 5;
         break;
      case FILE_IMMEDIATE:
         setShortImmediate(i, s);
@@ -556,7 +555,6 @@ CodeEmitterGK110::emitFADD(const Instruction *i)
      RND_(2a, F);
      ABS_(31, 0);
      NEG_(33, 0);
-      SAT_(35);

      if (code[0] & 0x1) {
         modNegAbsF32_3b(i, 1);
@@ -635,7 +633,7 @@ CodeEmitterGK110::emitISAD(const Instruction *i)
 {
   assert(i->dType == TYPE_S32 || i->dType == TYPE_U32);

-   emitForm_21(i, 0x1f4, 0xb74);
+   emitForm_21(i, 0x1fc, 0xb74);

   if (i->dType == TYPE_S32)
      code[1] |= 1 << 19;
@@ -713,7 +711,7 @@ CodeEmitterGK110::emitEXTBF(const Instruction *i)
 void
 CodeEmitterGK110::emitBFIND(const Instruction *i)
 {
-   emitForm_C(i, 0x218, 0x2);
+   emitForm_21(i, 0x618, 0xc18);

   if (i->dType == TYPE_S32)
      code[1] |= 0x80000;
@@ -954,7 +952,7 @@ CodeEmitterGK110::emitSLCT(const CmpInstruction *i)
      FTZ_(32);
      emitCondCode(cc, 0x33, 0xf);
   } else {
-      emitForm_21(i, 0x1a0, 0xb20);
+      emitForm_21(i, 0x1a4, 0xb20);
      emitCondCode(cc, 0x34, 0x7);
   }
 }
@@ -969,7 +967,7 @@ void CodeEmitterGK110::emitSELP(const Instruction *i)

 void CodeEmitterGK110::emitTEXBAR(const Instruction *i)
 {
-   code[0] = 0x0000003e | (i->subOp << 23);
+   code[0] = 0x00000002 | (i->subOp << 23);
   code[1] = 0x77000000;

   emitPredicate(i);
@@ -1206,7 +1204,7 @@ CodeEmitterGK110::emitFlow(const Instruction *i)
   case OP_PRECONT:  code[1] = 0x15800000; mask = 2; break;
   case OP_PRERET:   code[1] = 0x13800000; mask = 2; break;

-   case OP_QUADON:  code[1] = 0x1b800000; mask = 0; break;
+   case OP_QUADON:  code[1] = 0x1b000000; mask = 0; break;
   case OP_QUADPOP: code[1] = 0x1c000000; mask = 0; break;
   case OP_BRKPT:   code[1] = 0x00000000; mask = 0; break;
   default:
@@ -1328,8 +1326,7 @@ CodeEmitterGK110::emitOUT(const Instruction *i)
 void
 CodeEmitterGK110::emitInterpMode(const Instruction *i)
 {
-   code[1] |= (i->ipa & 0x3) << 21; // TODO: INTERP_SAMPLEID
-   code[1] |= (i->ipa & 0xc) << (19 - 2);
+   code[1] |= i->ipa << 21; // TODO: INTERP_SAMPLEID
 }

 void
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_from_tgsi.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_from_tgsi.cpp
@@ -790,8 +790,6 @@ bool Source::scanSource()
      info->prop.gp.instanceCount = 1; // default value
   }

-   info->io.viewportId = -1;
-
   info->immd.data = (uint32_t *)MALLOC(scan.immediate_count * 16);
   info->immd.type = (ubyte *)MALLOC(scan.immediate_count * sizeof(ubyte));

@@ -984,9 +982,6 @@ bool Source::scanDeclaration(const struct tgsi_full_declaration *decl)
         case TGSI_SEMANTIC_SAMPLEMASK:
            info->io.sampleMask = i;
            break;
-         case TGSI_SEMANTIC_VIEWPORT_INDEX:
-            info->io.viewportId = i;
-            break;
         default:
            break;
         }
@@ -1263,8 +1258,6 @@ private:
   Stack joinBBs;  // fork BB, for inserting join ops on ENDIF
   Stack loopBBs;  // loop headers
   Stack breakBBs; // end of / after loop
-
-   Value *viewport;
 };

 Symbol *
@@ -1562,16 +1555,8 @@ Converter::storeDst(const tgsi::Instruction::DstRegister dst, int c,
      mkOp2(OP_WRSV, TYPE_U32, NULL, dstToSym(dst, c), val);
   } else
   if (f == TGSI_FILE_OUTPUT && prog->getType() != Program::TYPE_FRAGMENT) {
-
-      if (ptr || (info->out[idx].mask & (1 << c))) {
-         /* Save the viewport index into a scratch register so that it can be
-            exported at EMIT time */
-         if (info->out[idx].sn == TGSI_SEMANTIC_VIEWPORT_INDEX &&
-             viewport != NULL)
-            mkOp1(OP_MOV, TYPE_U32, viewport, val);
-         else
-            mkStore(OP_EXPORT, TYPE_U32, dstToSym(dst, c), ptr, val);
-      }
+      if (ptr || (info->out[idx].mask & (1 << c)))
+         mkStore(OP_EXPORT, TYPE_U32, dstToSym(dst, c), ptr, val);
   } else
   if (f == TGSI_FILE_TEMPORARY ||
       f == TGSI_FILE_PREDICATE ||
@@ -2214,6 +2199,7 @@ Converter::handleInstruction(const struct tgsi_full_instruction *insn)
   case TGSI_OPCODE_IMUL_HI:
   case TGSI_OPCODE_UMUL_HI:
   case TGSI_OPCODE_OR:
+   case TGSI_OPCODE_POW:
   case TGSI_OPCODE_SHL:
   case TGSI_OPCODE_ISHR:
   case TGSI_OPCODE_USHR:
@@ -2268,11 +2254,6 @@ Converter::handleInstruction(const struct tgsi_full_instruction *insn)
      FOR_EACH_DST_ENABLED_CHANNEL(0, c, tgsi)
         mkOp1(OP_MOV, TYPE_U32, dst0[c], fetchSrc(0, c));
      break;
-   case TGSI_OPCODE_POW:
-      val0 = mkOp2v(op, TYPE_F32, getScratch(), fetchSrc(0, 0), fetchSrc(1, 0));
-      FOR_EACH_DST_ENABLED_CHANNEL(0, c, tgsi)
-         mkOp1(OP_MOV, TYPE_F32, dst0[c], val0);
-      break;
   case TGSI_OPCODE_EX2:
   case TGSI_OPCODE_LG2:
      val0 = mkOp1(op, TYPE_F32, getScratch(), fetchSrc(0, 0))->getDef(0);
@@ -2472,12 +2453,7 @@ Converter::handleInstruction(const struct tgsi_full_instruction *insn)
      break;
   case TGSI_OPCODE_KILL_IF:
      val0 = new_LValue(func, FILE_PREDICATE);
-      mask = 0;
      for (c = 0; c < 4; ++c) {
-         const int s = tgsi.getSrc(0).getSwizzle(c);
-         if (mask & (1 << s))
-            continue;
-         mask |= 1 << s;
         mkCmp(OP_SET, CC_LT, TYPE_F32, val0, TYPE_F32, fetchSrc(0, c), zero);
         mkOp(OP_DISCARD, TYPE_NONE, NULL)->setPredicate(CC_P, val0);
      }
@@ -2504,7 +2480,7 @@ Converter::handleInstruction(const struct tgsi_full_instruction *insn)
      break;
   case TGSI_OPCODE_TXB2:
   case TGSI_OPCODE_TXL2:
-      handleTEX(dst0, 2, 2, 0x10, 0x0f, 0x00, 0x00);
+      handleTEX(dst0, 2, 2, 0x10, 0x11, 0x00, 0x00);
      break;
   case TGSI_OPCODE_SAMPLE:
   case TGSI_OPCODE_SAMPLE_B:
@@ -2538,13 +2514,6 @@ Converter::handleInstruction(const struct tgsi_full_instruction *insn)
         mkCvt(OP_CVT, dstTy, dst0[c], srcTy, fetchSrc(0, c));
      break;
   case TGSI_OPCODE_EMIT:
-      /* export the saved viewport index */
-      if (viewport != NULL) {
-         Symbol *vpSym = mkSymbol(FILE_SHADER_OUTPUT, 0, TYPE_U32,
-                                  info->out[info->io.viewportId].slot[0] * 4);
-         mkStore(OP_EXPORT, TYPE_U32, vpSym, NULL, viewport);
-      }
-      /* fallthrough */
   case TGSI_OPCODE_ENDPRIM:
      // get vertex stream if specified (must be immediate)
      src0 = tgsi.srcCount() ?
@@ -2974,11 +2943,6 @@ Converter::run()
      mkOp1(OP_RCP, TYPE_F32, fragCoord[3], fragCoord[3]);
   }

-   if (info->io.viewportId >= 0)
-      viewport = getScratch();
-   else
-      viewport = NULL;
-
   for (ip = 0; ip < code->scan.num_instructions; ++ip) {
      if (!handleInstruction(&code->insns[ip]))
         return false;
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nv50.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nv50.cpp
@@ -37,25 +37,18 @@ namespace nv50_ir {
 //    ah*bl 00
 //
 // fffe0001 + fffe0001
-//
-// Note that this sort of splitting doesn't work for signed values, so we
-// compute the sign on those manually and then perform an unsigned multiply.
 static bool
 expandIntegerMUL(BuildUtil *bld, Instruction *mul)
 {
   const bool highResult = mul->subOp == NV50_IR_SUBOP_MUL_HIGH;

-   DataType fTy; // full type
-   switch (mul->sType) {
-   case TYPE_S32: fTy = TYPE_U32; break;
-   case TYPE_S64: fTy = TYPE_U64; break;
-   default: fTy = mul->sType; break;
-   }
-
-   DataType hTy; // half type
+   DataType fTy = mul->sType; // full type
+   DataType hTy;
   switch (fTy) {
+   case TYPE_S32: hTy = TYPE_S16; break;
   case TYPE_U32: hTy = TYPE_U16; break;
   case TYPE_U64: hTy = TYPE_U32; break;
+   case TYPE_S64: hTy = TYPE_S32; break;
   default:
      return false;
   }
@@ -66,25 +59,15 @@ expandIntegerMUL(BuildUtil *bld, Instruction *mul)

   bld->setPosition(mul, true);

-   Value *s[2];
   Value *a[2], *b[2];
+   Value *c[2];
   Value *t[4];
   for (int j = 0; j < 4; ++j)
      t[j] = bld->getSSA(fullSize);

-   s[0] = mul->getSrc(0);
-   s[1] = mul->getSrc(1);
-
-   if (isSignedType(mul->sType)) {
-      s[0] = bld->getSSA(fullSize);
-      s[1] = bld->getSSA(fullSize);
-      bld->mkOp1(OP_ABS, mul->sType, s[0], mul->getSrc(0));
-      bld->mkOp1(OP_ABS, mul->sType, s[1], mul->getSrc(1));
-   }
-
   // split sources into halves
-   i[0] = bld->mkSplit(a, halfSize, s[0]);
-   i[1] = bld->mkSplit(b, halfSize, s[1]);
+   i[0] = bld->mkSplit(a, halfSize, mul->getSrc(0));
+   i[1] = bld->mkSplit(b, halfSize, mul->getSrc(1));

   i[2] = bld->mkOp2(OP_MUL, fTy, t[0], a[0], b[1]);
   i[3] = bld->mkOp3(OP_MAD, fTy, t[1], a[1], b[0], t[0]);
@@ -92,76 +75,23 @@ expandIntegerMUL(BuildUtil *bld, Instruction *mul)
   i[4] = bld->mkOp3(OP_MAD, fTy, t[3], a[0], b[0], t[2]);

   if (highResult) {
-      Value *c[2];
-      Value *r[5];
+      Value *r[3];
      Value *imm = bld->loadImm(NULL, 1 << (halfSize * 8));
      c[0] = bld->getSSA(1, FILE_FLAGS);
      c[1] = bld->getSSA(1, FILE_FLAGS);
-      for (int j = 0; j < 5; ++j)
+      for (int j = 0; j < 3; ++j)
         r[j] = bld->getSSA(fullSize);

      i[8] = bld->mkOp2(OP_SHR, fTy, r[0], t[1], bld->mkImm(halfSize * 8));
      i[6] = bld->mkOp2(OP_ADD, fTy, r[1], r[0], imm);
-      bld->mkMov(r[3], r[0])->setPredicate(CC_NC, c[0]);
-      bld->mkOp2(OP_UNION, TYPE_U32, r[2], r[1], r[3]);
-      i[5] = bld->mkOp3(OP_MAD, fTy, r[4], a[1], b[1], r[2]);
+      bld->mkOp2(OP_UNION, TYPE_U32, r[2], r[1], r[0]);
+      i[5] = bld->mkOp3(OP_MAD, fTy, mul->getDef(0), a[1], b[1], r[2]);

      // set carry defs / sources
      i[3]->setFlagsDef(1, c[0]);
-      // actual result required in negative case, but ignored for
-      // unsigned. for some reason the compiler ends up dropping the whole
-      // instruction if the destination is unused but the flags are.
-      if (isSignedType(mul->sType))
-         i[4]->setFlagsDef(1, c[1]);
-      else
-         i[4]->setFlagsDef(0, c[1]);
+      i[4]->setFlagsDef(0, c[1]); // actual result not required, just the carry
      i[6]->setPredicate(CC_C, c[0]);
      i[5]->setFlagsSrc(3, c[1]);
-
-      if (isSignedType(mul->sType)) {
-         Value *cc[2];
-         Value *rr[7];
-         Value *one = bld->getSSA(fullSize);
-         bld->loadImm(one, 1);
-         for (int j = 0; j < 7; j++)
-            rr[j] = bld->getSSA(fullSize);
-
-         // NOTE: this logic uses predicates because splitting basic blocks is
-         // ~impossible during the SSA phase. The RA relies on a correlation
-         // between edge order and phi node sources.
-
-         // Set the sign of the result based on the inputs
-         bld->mkOp2(OP_XOR, fTy, NULL, mul->getSrc(0), mul->getSrc(1))
-            ->setFlagsDef(0, (cc[0] = bld->getSSA(1, FILE_FLAGS)));
-
-         // 1s complement of 64-bit value
-         bld->mkOp1(OP_NOT, fTy, rr[0], r[4])
-            ->setPredicate(CC_S, cc[0]);
-         bld->mkOp1(OP_NOT, fTy, rr[1], t[3])
-            ->setPredicate(CC_S, cc[0]);
-
-         // add to low 32-bits, keep track of the carry
-         Instruction *n = bld->mkOp2(OP_ADD, fTy, NULL, rr[1], one);
-         n->setPredicate(CC_S, cc[0]);
-         n->setFlagsDef(0, (cc[1] = bld->getSSA(1, FILE_FLAGS)));
-
-         // If there was a carry, add 1 to the upper 32 bits
-         // XXX: These get executed even if they shouldn't be
-         bld->mkOp2(OP_ADD, fTy, rr[2], rr[0], one)
-            ->setPredicate(CC_C, cc[1]);
-         bld->mkMov(rr[3], rr[0])
-            ->setPredicate(CC_NC, cc[1]);
-         bld->mkOp2(OP_UNION, fTy, rr[4], rr[2], rr[3]);
-
-         // Merge the results from the negative and non-negative paths
-         bld->mkMov(rr[5], rr[4])
-            ->setPredicate(CC_S, cc[0]);
-         bld->mkMov(rr[6], r[4])
-            ->setPredicate(CC_NS, cc[0]);
-         bld->mkOp2(OP_UNION, mul->sType, mul->getDef(0), rr[5], rr[6]);
-      } else {
-         bld->mkMov(mul->getDef(0), r[4]);
-      }
   } else {
      bld->mkMov(mul->getDef(0), t[3]);
   }
@@ -661,10 +591,6 @@ void NV50LoweringPreSSA::loadTexMsInfo(uint32_t off, Value **ms,
   Value *tmp = new_LValue(func, FILE_GPR);
   uint8_t b = prog->driver->io.resInfoCBSlot;
   off += prog->driver->io.suInfoBase;
-   if (prog->getType() > Program::TYPE_VERTEX)
-      off += 16 * 2 * 4;
-   if (prog->getType() > Program::TYPE_GEOMETRY)
-      off += 16 * 2 * 4;
   *ms_x = bld.mkLoadv(TYPE_U32, bld.mkSymbol(
                             FILE_MEMORY_CONST, b, TYPE_U32, off + 0), NULL);
   *ms_y = bld.mkLoadv(TYPE_U32, bld.mkSymbol(
@@ -797,16 +723,6 @@ NV50LoweringPreSSA::handleTXB(TexInstruction *i)
   const CondCode cc[4] = { CC_EQU, CC_S, CC_C, CC_O };
   int l, d;

-   // We can't actually apply bias *and* do a compare for a cube
-   // texture. Since the compare has to be done before the filtering, just
-   // drop the bias on the floor.
-   if (i->tex.target == TEX_TARGET_CUBE_SHADOW) {
-      i->op = OP_TEX;
-      i->setSrc(3, i->getSrc(4));
-      i->setSrc(4, NULL);
-      return handleTEX(i);
-   }
-
   handleTEX(i);
   Value *bias = i->getSrc(i->tex.target.getArgCount());
   if (bias->isUniform())
@@ -1289,11 +1205,8 @@ NV50LoweringPreSSA::checkPredicate(Instruction *insn)
   Value *pred = insn->getPredicate();
   Value *cdst;

-   // FILE_PREDICATE will simply be changed to FLAGS on conversion to SSA
-   if (!pred ||
-       pred->reg.file == FILE_FLAGS || pred->reg.file == FILE_PREDICATE)
+   if (!pred || pred->reg.file == FILE_FLAGS)
      return;
-
   cdst = bld.getSSA(1, FILE_FLAGS);

   bld.mkCmp(OP_SET, CC_NEU, insn->dType, cdst, insn->dType, bld.loadImm(NULL, 0), pred);
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_lowering_nvc0.cpp
@@ -26,7 +26,6 @@
 #include "codegen/nv50_ir_target_nvc0.h"

 #include <limits>
-#include <tr1/unordered_set>

 namespace nv50_ir {

@@ -149,8 +148,7 @@ private:
   bool insertTextureBarriers(Function *);
   inline bool insnDominatedBy(const Instruction *, const Instruction *) const;
   void findFirstUses(const Instruction *tex, const Instruction *def,
-                      std::list<TexUse>&,
-                      std::tr1::unordered_set<const Instruction *>&);
+                      std::list<TexUse>&);
   void findOverwritingDefs(const Instruction *tex, Instruction *insn,
                            const BasicBlock *term,
                            std::list<TexUse>&);
@@ -232,29 +230,15 @@ NVC0LegalizePostRA::findOverwritingDefs(const Instruction *texi,
 }

 void
-NVC0LegalizePostRA::findFirstUses(
-      const Instruction *texi,
-      const Instruction *insn,
-      std::list<TexUse> &uses,
-      std::tr1::unordered_set<const Instruction *>& visited)
+NVC0LegalizePostRA::findFirstUses(const Instruction *texi,
+                                  const Instruction *insn,
+                                  std::list<TexUse> &uses)
 {
   for (int d = 0; insn->defExists(d); ++d) {
      Value *v = insn->getDef(d);
      for (Value::UseIterator u = v->uses.begin(); u != v->uses.end(); ++u) {
         Instruction *usei = (*u)->getInsn();

-         // NOTE: In case of a loop that overwrites a value but never uses
-         // it, it can happen that we have a cycle of uses that consists only
-         // of phis and no-op moves and will thus cause an infinite loop here
-         // since these are not considered actual uses.
-         // The most obvious (and perhaps the only) way to prevent this is to
-         // remember which instructions we've already visited.
-
-         if (visited.find(usei) != visited.end())
-            continue;
-
-         visited.insert(usei);
-
         if (usei->op == OP_PHI || usei->op == OP_UNION) {
            // need a barrier before WAW cases
            for (int s = 0; usei->srcExists(s); ++s) {
@@ -269,11 +253,11 @@ NVC0LegalizePostRA::findFirstUses(
             usei->op == OP_PHI ||
             usei->op == OP_UNION) {
            // these uses don't manifest in the machine code
-            findFirstUses(texi, usei, uses, visited);
+            findFirstUses(texi, usei, uses);
         } else
         if (usei->op == OP_MOV && usei->getDef(0)->equals(usei->getSrc(0)) &&
             usei->subOp != NV50_IR_SUBOP_MOV_FINAL) {
-            findFirstUses(texi, usei, uses, visited);
+            findFirstUses(texi, usei, uses);
         } else {
            addTexUse(uses, usei, insn);
         }
@@ -329,10 +313,8 @@ NVC0LegalizePostRA::insertTextureBarriers(Function *fn)
   uses = new std::list<TexUse>[texes.size()];
   if (!uses)
      return false;
-   for (size_t i = 0; i < texes.size(); ++i) {
-      std::tr1::unordered_set<const Instruction *> visited;
-      findFirstUses(texes[i], texes[i], uses[i], visited);
-   }
+   for (size_t i = 0; i < texes.size(); ++i)
+      findFirstUses(texes[i], texes[i], uses[i]);

   // determine the barrier level at each use
   for (size_t i = 0; i < texes.size(); ++i) {
@@ -832,7 +814,6 @@ NVC0LoweringPass::handleManualTXD(TexInstruction *i)
   Value *zero = bld.loadImm(bld.getSSA(), 0);
   int l, c;
   const int dim = i->tex.target.getDim();
-   const int array = i->tex.target.isArray();

   i->op = OP_TEX; // no need to clone dPdx/dPdy later

@@ -843,7 +824,7 @@ NVC0LoweringPass::handleManualTXD(TexInstruction *i)
   for (l = 0; l < 4; ++l) {
      // mov coordinates from lane l to all lanes
      for (c = 0; c < dim; ++c)
-         bld.mkQuadop(0x00, crd[c], l, i->getSrc(c + array), zero);
+         bld.mkQuadop(0x00, crd[c], l, i->getSrc(c), zero);
      // add dPdx from lane l to lanes dx
      for (c = 0; c < dim; ++c)
         bld.mkQuadop(qOps[l][0], crd[c], l, i->dPdx[c].get(), crd[c]);
@@ -853,7 +834,7 @@ NVC0LoweringPass::handleManualTXD(TexInstruction *i)
      // texture
      bld.insert(tex = cloneForward(func, i));
      for (c = 0; c < dim; ++c)
-         tex->setSrc(c + array, crd[c]);
+         tex->setSrc(c, crd[c]);
      // save results
      for (c = 0; i->defExists(c); ++c) {
         Instruction *mov;
@@ -889,8 +870,7 @@ NVC0LoweringPass::handleTXD(TexInstruction *txd)
   if (dim > 2 ||
       txd->tex.target.isCube() ||
       arg > 4 ||
-       txd->tex.target.isShadow() ||
-       txd->tex.useOffsets)
+       txd->tex.target.isShadow())
      return handleManualTXD(txd);

   for (int c = 0; c < dim; ++c) {
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_peephole.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_peephole.cpp
@@ -187,8 +187,7 @@ LoadPropagation::checkSwapSrc01(Instruction *insn)
      return;
   }

-   if (insn->op == OP_SET || insn->op == OP_SET_AND ||
-       insn->op == OP_SET_OR || insn->op == OP_SET_XOR)
+   if (insn->op == OP_SET)
      insn->asCmp()->setCond = reverseCondCode(insn->asCmp()->setCond);
   else
   if (insn->op == OP_SLCT)
@@ -425,17 +424,7 @@ ConstantFolding::expr(Instruction *i,
      case TYPE_F32: res.data.f32 = a->data.f32 * b->data.f32; break;
      case TYPE_F64: res.data.f64 = a->data.f64 * b->data.f64; break;
      case TYPE_S32:
-         if (i->subOp == NV50_IR_SUBOP_MUL_HIGH) {
-            res.data.s32 = ((int64_t)a->data.s32 * b->data.s32) >> 32;
-            break;
-         }
-         /* fallthrough */
-      case TYPE_U32:
-         if (i->subOp == NV50_IR_SUBOP_MUL_HIGH) {
-            res.data.u32 = ((uint64_t)a->data.u32 * b->data.u32) >> 32;
-            break;
-         }
-         res.data.u32 = a->data.u32 * b->data.u32; break;
+      case TYPE_U32: res.data.u32 = a->data.u32 * b->data.u32; break;
      default:
         return;
      }
@@ -560,14 +549,9 @@ ConstantFolding::expr(Instruction *i,
      ImmediateValue src0;
      if (i->src(0).getImmediate(src0))
         expr(i, src0, *i->getSrc(1)->asImm());
-      if (i->saturate && !prog->getTarget()->isSatSupported(i)) {
-         bld.setPosition(i, false);
-         i->setSrc(1, bld.loadImm(NULL, res.data.u32));
-      }
   } else {
-      i->op = i->saturate ? OP_SAT : OP_MOV; /* SAT handled by unary() */
+      i->op = OP_MOV;
   }
-   i->subOp = 0;
 }

 void
@@ -617,7 +601,6 @@ ConstantFolding::unary(Instruction *i, const ImmediateValue &imm)
   switch (i->op) {
   case OP_NEG: res.data.f32 = -imm.reg.data.f32; break;
   case OP_ABS: res.data.f32 = fabsf(imm.reg.data.f32); break;
-   case OP_SAT: res.data.f32 = CLAMP(imm.reg.data.f32, 0.0f, 1.0f); break;
   case OP_RCP: res.data.f32 = 1.0f / imm.reg.data.f32; break;
   case OP_RSQ: res.data.f32 = 1.0f / sqrtf(imm.reg.data.f32); break;
   case OP_LG2: res.data.f32 = log2f(imm.reg.data.f32); break;
@@ -707,41 +690,12 @@ ConstantFolding::opnd(Instruction *i, ImmediateValue &imm0, int s)
 {
   const int t = !s;
   const operation op = i->op;
-   Instruction *newi = i;

   switch (i->op) {
   case OP_MUL:
      if (i->dType == TYPE_F32)
         tryCollapseChainedMULs(i, s, imm0);

-      if (i->subOp == NV50_IR_SUBOP_MUL_HIGH) {
-         assert(!isFloatType(i->sType));
-         if (imm0.isInteger(1) && i->dType == TYPE_S32) {
-            bld.setPosition(i, false);
-            // Need to set to the sign value, which is a compare.
-            newi = bld.mkCmp(OP_SET, CC_LT, TYPE_S32, i->getDef(0),
-                             TYPE_S32, i->getSrc(t), bld.mkImm(0));
-            delete_Instruction(prog, i);
-         } else if (imm0.isInteger(0) || imm0.isInteger(1)) {
-            // The high bits can't be set in this case (either mul by 0 or
-            // unsigned by 1)
-            i->op = OP_MOV;
-            i->subOp = 0;
-            i->setSrc(0, new_ImmediateValue(prog, 0u));
-            i->src(0).mod = Modifier(0);
-            i->setSrc(1, NULL);
-         } else if (!imm0.isNegative() && imm0.isPow2()) {
-            // Translate into a shift
-            imm0.applyLog2();
-            i->op = OP_SHR;
-            i->subOp = 0;
-            imm0.reg.data.u32 = 32 - imm0.reg.data.u32;
-            i->setSrc(0, i->getSrc(t));
-            i->src(0).mod = i->src(t).mod;
-            i->setSrc(1, new_ImmediateValue(prog, imm0.reg.data.u32));
-            i->src(1).mod = 0;
-         }
-      } else
      if (imm0.isInteger(0)) {
         i->op = OP_MOV;
         i->setSrc(0, new_ImmediateValue(prog, 0u));
@@ -832,7 +786,7 @@ ConstantFolding::opnd(Instruction *i, ImmediateValue &imm0, int s)
         else
            tA = tB;
         tB = s ? bld.getSSA() : i->getDef(0);
-         newi = bld.mkOp2(OP_ADD, TYPE_U32, tB, mul->getDef(0), tA);
+         bld.mkOp2(OP_ADD, TYPE_U32, tB, mul->getDef(0), tA);
         if (s)
            bld.mkOp2(OP_SHR, TYPE_U32, i->getDef(0), tB, bld.mkImm(s));

@@ -864,7 +818,7 @@ ConstantFolding::opnd(Instruction *i, ImmediateValue &imm0, int s)
         tA = bld.getSSA();
         bld.mkCmp(OP_SET, CC_LT, TYPE_S32, tA, TYPE_S32, i->getSrc(0), bld.mkImm(0));
         tD = (d < 0) ? bld.getSSA() : i->getDef(0)->asLValue();
-         newi = bld.mkOp2(OP_SUB, TYPE_U32, tD, tB, tA);
+         bld.mkOp2(OP_SUB, TYPE_U32, tD, tB, tA);
         if (d < 0)
            bld.mkOp1(OP_NEG, TYPE_S32, i->getDef(0), tB);

@@ -928,7 +882,6 @@ ConstantFolding::opnd(Instruction *i, ImmediateValue &imm0, int s)

   case OP_ABS:
   case OP_NEG:
-   case OP_SAT:
   case OP_LG2:
   case OP_RCP:
   case OP_SQRT:
@@ -943,7 +896,7 @@ ConstantFolding::opnd(Instruction *i, ImmediateValue &imm0, int s)
   default:
      return;
   }
-   if (newi->op != op)
+   if (i->op != op)
      foldCount++;
 }

--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_ra.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_ra.cpp
@@ -998,9 +998,7 @@ GCRA::doCoalesce(ArrayList& insns, unsigned int mask)
      case OP_TXQ:
      case OP_TXD:
      case OP_TXG:
-      case OP_TXLQ:
      case OP_TEXCSAA:
-      case OP_TEXPREP:
         if (!(mask & JOIN_MASK_TEX))
            break;
         for (c = 0; insn->srcExists(c) && c != insn->predSrc; ++c)
@@ -1654,10 +1652,6 @@ RegAlloc::execFunc()
           ret && i <= func->loopNestingBound;
           sequence = func->cfg.nextSequence(), ++i)
         ret = buildLiveSets(BasicBlock::get(func->cfg.getRoot()));
-      // reset marker
-      for (ArrayList::Iterator bi = func->allBBlocks.iterator();
-           !bi.end(); bi.next())
-         BasicBlock::get(bi)->liveSet.marker = false;
      if (!ret)
         break;
      func->orderInstructions(this->insns);
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nv50.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nv50.cpp
@@ -331,8 +331,6 @@ TargetNV50::insnCanLoad(const Instruction *i, int s,
         return false;
      if (sf == FILE_IMMEDIATE)
         return false;
-      if (i->subOp == NV50_IR_SUBOP_MUL_HIGH && sf == FILE_MEMORY_CONST)
-         return false;
      ldSize = 2;
   } else {
      ldSize = typeSizeof(ld->dType);
@@ -448,7 +446,7 @@ TargetNV50::isModSupported(const Instruction *insn, int s, Modifier mod) const
         return false;
      }
   }
-   if (s >= 3)
+   if (s > 3)
      return false;
   return (mod & Modifier(opInfo[insn->op].srcMods[s])) == mod;
 }
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nvc0.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_target_nvc0.cpp
@@ -417,7 +417,7 @@ TargetNVC0::isModSupported(const Instruction *insn, int s, Modifier mod) const
         return false;
      }
   }
-   if (s >= 3)
+   if (s > 3)
      return false;
   return (mod & Modifier(opInfo[insn->op].srcMods[s])) == mod;
 }
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_util.cpp
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_util.cpp
@@ -254,9 +254,7 @@ bool BitSet::resize(unsigned int nBits)
      return false;
   }
   if (n > p)
-      memset(&data[p], 0, (n - p) * 4);
-   if (nBits < size && (nBits % 32))
-      data[(nBits + 31) / 32 - 1] &= (1 << (nBits % 32)) - 1;
+      memset(&data[4 * p + 4], 0, (n - p) * 4);

   size = nBits;
   return true;
@@ -276,8 +274,8 @@ bool BitSet::allocate(unsigned int nBits, bool zero)
   if (zero)
      memset(data, 0, (size + 7) / 8);
   else
-   if (size % 32) // clear unused bits (e.g. for popCount)
-      data[(size + 31) / 32 - 1] &= (1 << (size % 32)) - 1;
+   if (nBits)
+      data[(size + 31) / 32 - 1] = 0; // clear unused bits (e.g. for popCount)

   return data;
 }
--- a/src/gallium/drivers/nouveau/codegen/nv50_ir_util.h
+++ b/src/gallium/drivers/nouveau/codegen/nv50_ir_util.h
@@ -484,7 +484,6 @@ public:
         FREE(data);
   }

-   // allocate will keep old data iff size is unchanged
   bool allocate(unsigned int nBits, bool zero);
   bool resize(unsigned int nBits); // keep old data, zero additional bits

--- a/src/gallium/drivers/nouveau/nouveau_vp3_video.h
+++ b/src/gallium/drivers/nouveau/nouveau_vp3_video.h
@@ -39,8 +39,6 @@ struct nouveau_vp3_video_buffer {
 #define VP_OFFSET 0x200
 #define COMM_OFFSET 0x500

-#define NOUVEAU_VP3_BSP_RESERVED_SIZE 0x700
-
 #define NOUVEAU_VP3_DEBUG_FENCE 0

 #if NOUVEAU_VP3_DEBUG_FENCE
--- a/src/gallium/drivers/nouveau/nouveau_vp3_video_vp.c
+++ b/src/gallium/drivers/nouveau/nouveau_vp3_video_vp.c
@@ -78,10 +78,10 @@ struct mpeg4_picparm_vp {
 	uint8_t top_field_first; // bool, written to vuc

 	uint8_t pad4[3]; // 59, 5a, 5b, contains garbage on blob
+	uint32_t pad5[0x10]; // 5c...9c non-inclusive, but WHY?

-	uint32_t intra[0x10]; // 5c
-	uint32_t non_intra[0x10]; // 9c
-	uint32_t pad5[0x10]; // bc what does this do?
+	uint32_t intra[0x10]; // 9c
+	uint32_t non_intra[0x10]; // bc
 	// udc..uff pad?
 };

@@ -196,15 +196,11 @@ nouveau_vp3_handle_references(struct nouveau_vp3_decoder *dec, struct nouveau_vp
   /* Try to find a real empty spot first, there should be one..
    */
   for (i = 0; i < dec->base.max_references + 1; ++i) {
-      if (dec->refs[i].vidbuf == target) {
+      if (dec->refs[i].last_used != seq) {
         empty_spot = i;
         break;
-      } else if (!dec->refs[i].last_used) {
-         empty_spot = i;
-      } else if (empty_spot == ~0U && dec->refs[i].last_used != seq)
-         empty_spot = i;
+      }
   }
-
   assert(empty_spot < dec->base.max_references+1);
   dec->refs[empty_spot].last_used = seq;
 //   debug_printf("Kicked %p to add %p to slot %i\n", dec->refs[empty_spot].vidbuf, target, empty_spot);
@@ -271,6 +267,7 @@ nouveau_vp3_fill_picparm_mpeg4_vp(struct nouveau_vp3_decoder *dec,
 {
   struct mpeg4_picparm_vp pic_vp_stub = {}, *pic_vp = &pic_vp_stub;
   uint32_t ring, ret = 0x01014; // !async_shutdown << 16 | watchdog << 12 | irq_record << 4 | unk;
+   assert(!(dec->base.width & 0xf));
   *is_ref = desc->vop_coding_type <= 1;

   pic_vp->width = dec->base.width;
@@ -466,45 +463,14 @@ void nouveau_vp3_vp_caps(struct nouveau_vp3_decoder *dec, union pipe_desc desc,
   case PIPE_VIDEO_FORMAT_MPEG12:
      *caps = nouveau_vp3_fill_picparm_mpeg12_vp(dec, desc.mpeg12, refs, is_ref, vp);
      nouveau_vp3_handle_references(dec, refs, dec->fence_seq, target);
-      switch (desc.mpeg12->picture_structure) {
-      case PIPE_MPEG12_PICTURE_STRUCTURE_FIELD_TOP:
-         dec->refs[target->valid_ref].decoded_top = 1;
-         break;
-      case PIPE_MPEG12_PICTURE_STRUCTURE_FIELD_BOTTOM:
-         dec->refs[target->valid_ref].decoded_bottom = 1;
-         break;
-      default:
-         dec->refs[target->valid_ref].decoded_top = 1;
-         dec->refs[target->valid_ref].decoded_bottom = 1;
-         break;
-      }
      return;
   case PIPE_VIDEO_FORMAT_MPEG4:
      *caps = nouveau_vp3_fill_picparm_mpeg4_vp(dec, desc.mpeg4, refs, is_ref, vp);
      nouveau_vp3_handle_references(dec, refs, dec->fence_seq, target);
-      // XXX: Correct?
-      if (!desc.mpeg4->interlaced) {
-         dec->refs[target->valid_ref].decoded_top = 1;
-         dec->refs[target->valid_ref].decoded_bottom = 1;
-      } else if (desc.mpeg4->top_field_first) {
-         if (!dec->refs[target->valid_ref].decoded_top)
-            dec->refs[target->valid_ref].decoded_top = 1;
-         else
-            dec->refs[target->valid_ref].decoded_bottom = 1;
-      } else {
-         if (!dec->refs[target->valid_ref].decoded_bottom)
-            dec->refs[target->valid_ref].decoded_bottom = 1;
-         else
-            dec->refs[target->valid_ref].decoded_top = 1;
-      }
      return;
   case PIPE_VIDEO_FORMAT_VC1: {
      *caps = nouveau_vp3_fill_picparm_vc1_vp(dec, desc.vc1, refs, is_ref, vp);
      nouveau_vp3_handle_references(dec, refs, dec->fence_seq, target);
-      if (desc.vc1->frame_coding_mode == 3)
-         debug_printf("Field-Interlaced possibly incorrectly handled\n");
-      dec->refs[target->valid_ref].decoded_top = 1;
-      dec->refs[target->valid_ref].decoded_bottom = 1;
      return;
   }
   case PIPE_VIDEO_FORMAT_MPEG4_AVC: {
--- a/src/gallium/drivers/nouveau/nv30/nv30_context.c
+++ b/src/gallium/drivers/nouveau/nv30/nv30_context.c
@@ -165,9 +165,6 @@ nv30_context_destroy(struct pipe_context *pipe)
   if (nv30->draw)
      draw_destroy(nv30->draw);

-   if (nv30->screen->base.pushbuf->user_priv == &nv30->bufctx)
-      nv30->screen->base.pushbuf->user_priv = NULL;
-
   nouveau_bufctx_del(&nv30->bufctx);

   if (nv30->screen->cur_ctx == nv30)
--- a/src/gallium/drivers/nouveau/nv30/nv30_screen.c
+++ b/src/gallium/drivers/nouveau/nv30/nv30_screen.c
@@ -325,12 +325,6 @@ nv30_screen_destroy(struct pipe_screen *pscreen)
      nouveau_fence_ref(NULL, &screen->base.fence.current);
   }

-   nouveau_bo_ref(NULL, &screen->notify);
-
-   nouveau_heap_destroy(&screen->query_heap);
-   nouveau_heap_destroy(&screen->vp_exec_heap);
-   nouveau_heap_destroy(&screen->vp_data_heap);
-
   nouveau_object_del(&screen->query);
   nouveau_object_del(&screen->fence);
   nouveau_object_del(&screen->ntfy);
--- a/src/gallium/drivers/nouveau/nv30/nv30_state.c
+++ b/src/gallium/drivers/nouveau/nv30/nv30_state.c
@@ -23,7 +23,6 @@
 *
 */

-#include "util/u_format.h"
 #include "util/u_helpers.h"
 #include "util/u_inlines.h"

@@ -361,22 +360,6 @@ nv30_set_framebuffer_state(struct pipe_context *pipe,

    nv30->framebuffer = *fb;
    nv30->dirty |= NV30_NEW_FRAMEBUFFER;
-
-   /* Hardware can't handle different swizzled-ness or different blocksizes
-    * for zs and cbufs. If both are supplied and something doesn't match,
-    * blank out the zs for now so that at least *some* rendering can occur.
-    */
-    if (fb->nr_cbufs > 0 && fb->zsbuf) {
-       struct nv30_miptree *color_mt = nv30_miptree(fb->cbufs[0]->texture);
-       struct nv30_miptree *zeta_mt = nv30_miptree(fb->zsbuf->texture);
-
-       if (color_mt->swizzled != zeta_mt->swizzled ||
-           (util_format_get_blocksize(fb->zsbuf->format) > 2) !=
-           (util_format_get_blocksize(fb->cbufs[0]->format) > 2)) {
-          nv30->framebuffer.zsbuf = NULL;
-          debug_printf("Mismatched color and zeta formats, ignoring zeta.\n");
-       }
-    }
 }

 static void
--- a/src/gallium/drivers/nouveau/nv30/nvfx_fragprog.c
+++ b/src/gallium/drivers/nouveau/nv30/nvfx_fragprog.c
@@ -1225,7 +1225,6 @@ out:
   if(fpc)
   {
      FREE(fpc->r_temp);
-      FREE(fpc->r_imm);
      util_dynarray_fini(&fpc->if_stack);
      util_dynarray_fini(&fpc->label_relocs);
      util_dynarray_fini(&fpc->imm_data);
--- a/src/gallium/drivers/nouveau/nv50/nv50_context.c
+++ b/src/gallium/drivers/nouveau/nv50/nv50_context.c
@@ -61,7 +61,7 @@ static void
 nv50_memory_barrier(struct pipe_context *pipe, unsigned flags)
 {
   struct nv50_context *nv50 = nv50_context(pipe);
-   int i, s;
+   int i;

   if (flags & PIPE_BARRIER_MAPPED_BUFFER) {
      for (i = 0; i < nv50->num_vtxbufs; ++i) {
@@ -74,26 +74,6 @@ nv50_memory_barrier(struct pipe_context *pipe, unsigned flags)
      if (nv50->idxbuf.buffer &&
          nv50->idxbuf.buffer->flags & PIPE_RESOURCE_FLAG_MAP_PERSISTENT)
         nv50->base.vbo_dirty = TRUE;
-
-      for (s = 0; s < 3 && !nv50->cb_dirty; ++s) {
-         uint32_t valid = nv50->constbuf_valid[s];
-
-         while (valid && !nv50->cb_dirty) {
-            const unsigned i = ffs(valid) - 1;
-            struct pipe_resource *res;
-
-            valid &= ~(1 << i);
-            if (nv50->constbuf[s][i].user)
-               continue;
-
-            res = nv50->constbuf[s][i].u.buf;
-            if (!res)
-               continue;
-
-            if (res->flags & PIPE_RESOURCE_FLAG_MAP_PERSISTENT)
-               nv50->cb_dirty = TRUE;
-         }
-      }
   }
 }

@@ -142,9 +122,12 @@ nv50_destroy(struct pipe_context *pipe)
 {
   struct nv50_context *nv50 = nv50_context(pipe);

-   if (nv50_context_screen(nv50)->cur_ctx == nv50)
+   if (nv50_context_screen(nv50)->cur_ctx == nv50) {
+      nv50->base.pushbuf->kick_notify = NULL;
      nv50_context_screen(nv50)->cur_ctx = NULL;
-   nouveau_pushbuf_bufctx(nv50->base.pushbuf, NULL);
+      nouveau_pushbuf_bufctx(nv50->base.pushbuf, NULL);
+   }
+   /* need to flush before destroying the bufctx */
   nouveau_pushbuf_kick(nv50->base.pushbuf, nv50->base.pushbuf->channel);

   nv50_context_unreference_resources(nv50);
@@ -273,14 +256,7 @@ nv50_create(struct pipe_screen *pscreen, void *priv)
   nv50->base.screen    = &screen->base;
   nv50->base.copy_data = nv50_m2mf_copy_linear;
   nv50->base.push_data = nv50_sifc_linear_u8;
-   /* FIXME: Make it possible to use this again. The problem is that there is
-    * some clever logic in the card that allows for multiple renders to happen
-    * when there are only constbuf changes. However that relies on the
-    * constbuf updates happening to the right constbuf slots. Currently
-    * implementation just makes it go through a separate slot which doesn't
-    * properly update the right constbuf data.
   nv50->base.push_cb   = nv50_cb_push;
-    */

   nv50->screen = screen;
   pipe->screen = pscreen;
--- a/src/gallium/drivers/nouveau/nv50/nv50_context.h
+++ b/src/gallium/drivers/nouveau/nv50/nv50_context.h
@@ -78,16 +78,16 @@
 /* 8 user clip planes, at 4 32-bit floats each */
 #define NV50_CB_AUX_UCP_OFFSET    0x0000
 #define NV50_CB_AUX_UCP_SIZE      (8 * 4 * 4)
-/* 16 textures * 3 shaders, each with ms_x, ms_y u32 pairs */
+/* 256 textures, each with ms_x, ms_y u32 pairs */
 #define NV50_CB_AUX_TEX_MS_OFFSET 0x0080
-#define NV50_CB_AUX_TEX_MS_SIZE   (16 * 3 * 2 * 4)
+#define NV50_CB_AUX_TEX_MS_SIZE   (256 * 2 * 4)
 /* For each MS level (4), 8 sets of 32-bit integer pairs sample offsets */
-#define NV50_CB_AUX_MS_OFFSET     0x200
+#define NV50_CB_AUX_MS_OFFSET     0x880
 #define NV50_CB_AUX_MS_SIZE       (4 * 8 * 4 * 2)
 /* Sample position pairs for the current output MS level */
-#define NV50_CB_AUX_SAMPLE_OFFSET 0x300
+#define NV50_CB_AUX_SAMPLE_OFFSET 0x980
 #define NV50_CB_AUX_SAMPLE_OFFSET_SIZE (4 * 8 * 2)
-/* next spot: 0x340 */
+/* next spot: 0x9c0 */
 /* 4 32-bit floats for the vertex runout, put at the end */
 #define NV50_CB_AUX_RUNOUT_OFFSET (NV50_CB_AUX_SIZE - 0x10)

@@ -106,7 +106,6 @@ struct nv50_context {
   struct nouveau_bufctx *bufctx;

   uint32_t dirty;
-   boolean cb_dirty;

   struct {
      uint32_t instance_elts; /* bitmask of per-instance elements */
--- a/src/gallium/drivers/nouveau/nv50/nv50_query.c
+++ b/src/gallium/drivers/nouveau/nv50/nv50_query.c
@@ -332,7 +332,7 @@ nv50_render_condition(struct pipe_context *pipe,
   nv50->cond_cond = condition;
   nv50->cond_mode = mode;

-   PUSH_SPACE(push, 9);
+   PUSH_SPACE(push, 6);

   if (!pq) {
      BEGIN_NV04(push, NV50_3D(COND_MODE), 1);
@@ -351,10 +351,6 @@ nv50_render_condition(struct pipe_context *pipe,
   PUSH_DATAh(push, q->bo->offset + q->offset);
   PUSH_DATA (push, q->bo->offset + q->offset);
   PUSH_DATA (push, NV50_3D_COND_MODE_RES_NON_ZERO);
-
-   BEGIN_NV04(push, NV50_2D(COND_ADDRESS_HIGH), 2);
-   PUSH_DATAh(push, q->bo->offset + q->offset);
-   PUSH_DATA (push, q->bo->offset + q->offset);
 }

 void
--- a/Show More
+++ b/Show More
Author	SHA1	Message	Date
Ian Romanick	2e3ded0f44	mesa: Bump version to 10.2-rc2 Signed-off-by: Ian Romanick <ian.d.romanick@intel.com>	2014-05-09 20:02:02 -07:00
Emil Velikov	fbc15d34c3	glx/tests: Partially revert commit `51e3569573` C++ does not support designated initializers, thus compilation is not guaranteed to succeed. Surprisingly gcc 4.6.3 fails to build the code, while version 4.9.0 compiles it without a hitch. Cc: "10.2" <mesa-stable@lists.freedesktop.org> Bugzilla: https://bugs.freedesktop.org/show_bug.cgi?id=78403 Signed-off-by: Emil Velikov <emil.l.velikov@gmail.com> Tested-by: Vinson Lee <vlee@freedesktop.org> (cherry picked from commit `326b8e253e`)	2014-05-09 18:33:27 -07:00
Emil Velikov	f6b31ce57d	configure: error out if building GBM without dri Both backends require --enable-dri, and building an empty libgbm makes little to no sense. Error out at configure to prevent the user from shooting themselves in the foot. Bugzilla: https://bugs.freedesktop.org/show_bug.cgi?id=78225 Cc: "10.1 10.2" <mesa-stable@lists.freedesktop.org> Signed-off-by: Emil Velikov <emil.l.velikov@gmail.com> Reviewed-by: Kenneth Graunke <kenneth@whitecape.org> (cherry picked from commit `e477d12c33`)	2014-05-09 18:33:22 -07:00
Kenneth Graunke	441a8ea491	i965: Fix GPU hangs on Broadwell in shaders with some control flow. According to the documentation, we need to set the source 0 register type to IMM for flow control instructions that have both JIP and UIP. Fixes GPU hangs in approximately 10 Piglit tests, 5 es3conform tests, Unigine Crypt, a WebGL raytracer demo, and several Steam titles. Cc: "10.2" <mesa-stable@lists.freedesktop.org> Bugzilla: https://bugs.freedesktop.org/show_bug.cgi?id=75478 Bugzilla: https://bugs.freedesktop.org/show_bug.cgi?id=75878 Bugzilla: https://bugs.freedesktop.org/show_bug.cgi?id=76939 Signed-off-by: Kenneth Graunke <kenneth@whitecape.org> Tested-by: Topi Pohjolainen <topi.pohjolainen@intel.com> Tested-by: Kristian Høgsberg <krh@bitplanet.net> Reviewed-by: Jordan Justen <jordan.l.justen@intel.com> Reviewed-by: Matt Turner <mattst88@gmail.com> (cherry picked from commit `9584959123`)	2014-05-09 18:32:57 -07:00
Tom Stellard	3d10bc0e5f	radeonsi: Enable geometry shaders with LLVM 3.4.1 Reviewed-by: Michel Dänzer <michel.daenzer@amd.com> CC: "10.1 10.2" <mesa-stable@lists.freedesktop.org> (cherry picked from commit `93c2ebbd83`)	2014-05-09 18:32:39 -07:00
Tom Stellard	559fc2d706	configure.ac: Add LLVM_VERSION_PATCH to DEFINES Reviewed-by: Michel Dänzer <michel.daenzer@amd.com> CC: "10.1 10.2" <mesa-stable@lists.freedesktop.org> (cherry picked from commit `c5d0008325`)	2014-05-09 18:31:29 -07:00
Thomas Hellstrom	e216ce1795	st/xa: Fix performance regression introduced by commit "Cache render target surface" The mentioned commit has the nasty side-effect of turning off accelerated copies. Cc: "10.1 10.2" <mesa-stable@lists.freedesktop.org> Signed-off-by: Thomas Hellstrom <thellstrom@vmware.com> Reviewed-by: Jakob Bornecrantz <jakob@vmware.com> Reviewed-by: Rob Clark <robdclark@gmail.com> (cherry picked from commit `9306b7c171`)	2014-05-09 18:31:07 -07:00
Tom Stellard	de219af04c	clover: Destory pipe_screen when device does not support compute v2 v2: - Make sure screen was successfully created before destroying it. Cc: "10.2" <mesa-stable@lists.freedesktop.org> Reviewed-by: Francisco Jerez <currojerez@riseup.net> (cherry picked from commit `c5f0c98c49`)	2014-05-09 18:31:03 -07:00
Tom Stellard	6be3f110e9	pipe-loader: Don't destroy the winsys in the sw loader The screen takes ownership of the winsys, and is responsible for destroying it. Users of pipe-loader should make sure they destory and screens they've created to avoid memory leaks. This fixes a crash in clover introduced by `ce6c17c083` where the pipe-loader was destroying the winsys while a screen was still using it. Cc: "10.2" <mesa-stable@lists.freedesktop.org> Reviewed-by: Emil Velikov <emil.l.velikov@gmail.com> (cherry picked from commit `c650033b86`)	2014-05-09 18:30:38 -07:00
Roland Scheidegger	c469c8daab	draw: do not use draw_get_option_use_llvm() inside draw execution paths `1c73e919a4` made it possible to not allocate the tgsi machine if llvm was used. However, draw_get_option_use_llvm() is not reliable after draw context creation, since drivers can explicitly request a non-llvm draw context even if draw_get_option_use_llvm() would return true (and softpipe does just that) which leads to crashes. Thus use draw->llvm to determine if we're using llvm or not instead (and make draw->llvm available even if HAVE_LLVM is false so we don't have to put even more ifdefs). Cc: "10.2" <mesa-stable@lists.freedesktop.org> Reviewed-by: Brian Paul <brianp@vmware.com> (cherry picked from commit `9af68e9b1d`)	2014-05-09 18:29:11 -07:00
Kenneth Graunke	0b3924b41e	i965: Fix depth (array slices) computation for 1D_ARRAY render targets. 1D array targets store the number of slices in the Height field. Fixes Piglit's spec/!OpenGL 3.2/layered-rendering/clear-color-all-types 1d_array single_level, at least when used with Meta clears. Cc: "10.2 10.1 10.0" <mesa-stable@lists.freedesktop.org> Signed-off-by: Kenneth Graunke <kenneth@whitecape.org> Reviewed-by: Jordan Justen <jordan.l.justen@intel.com> (cherry picked from commit `e6967270c7`)	2014-05-09 18:28:34 -07:00