Add a test for reading tiled objects with pread.
authorEric Anholt <eric@anholt.net>
Tue, 7 Apr 2009 23:21:16 +0000 (16:21 -0700)
committerEric Anholt <eric@anholt.net>
Wed, 8 Apr 2009 02:06:36 +0000 (19:06 -0700)
.gitignore
tests/Makefile.am
tests/gem_tiled_pread.c [new file with mode: 0644]

index aea96c1..6511a95 100644 (file)
@@ -41,6 +41,7 @@ tests/gem_mmap
 tests/gem_pread_after_blit
 tests/gem_readwrite
 tests/gem_tiled_blits
+tests/gem_tiled_pread
 tools/intel_gpu_dump
 tools/intel_gpu_top
 tools/intel_stepping
index a3d1c83..823ee65 100644 (file)
@@ -6,6 +6,7 @@ TESTS = getversion \
        gem_readwrite \
        gem_mmap \
        gem_pread_after_blit \
+       gem_tiled_pread \
        gem_tiled_blits
 
 EXTRA_PROGRAMS = $(TESTS)
diff --git a/tests/gem_tiled_pread.c b/tests/gem_tiled_pread.c
new file mode 100644 (file)
index 0000000..a6b99bd
--- /dev/null
@@ -0,0 +1,265 @@
+/*
+ * Copyright © 2009 Intel Corporation
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice (including the next
+ * paragraph) shall be included in all copies or substantial portions of the
+ * Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
+ * IN THE SOFTWARE.
+ *
+ * Authors:
+ *    Eric Anholt <eric@anholt.net>
+ *
+ */
+
+/** @file gem_tiled_pread.c
+ *
+ * This is a test of pread's behavior on tiled objects with respect to the
+ * reported swizzling value.
+ *
+ * The goal is to exercise the slow_bit17_copy path for reading on bit17
+ * machines, but will also be useful for catching swizzling value bugs on
+ * other systems.
+ */
+
+#include <stdlib.h>
+#include <stdio.h>
+#include <string.h>
+#include <assert.h>
+#include <fcntl.h>
+#include <inttypes.h>
+#include <errno.h>
+#include <sys/stat.h>
+#include <sys/time.h>
+#include "drm.h"
+#include "i915_drm.h"
+#include "drmtest.h"
+#include "intel_bufmgr.h"
+#include "intel_batchbuffer.h"
+#include "intel_gpu_tools.h"
+
+static drm_intel_bufmgr *bufmgr;
+struct intel_batchbuffer *batch;
+static const int width = 512, height = 512;
+static const int size = 1024 * 1024;
+
+#define PAGE_SIZE 4096
+
+static void
+copy_bo(drm_intel_bo *dst_bo, drm_intel_bo *src_bo)
+{
+       uint32_t src_tiling, dst_tiling, swizzle;
+       uint32_t src_pitch, dst_pitch;
+       uint32_t cmd_bits = 0;
+
+       drm_intel_bo_get_tiling(src_bo, &src_tiling, &swizzle);
+       drm_intel_bo_get_tiling(dst_bo, &dst_tiling, &swizzle);
+
+       src_pitch = width * 4;
+       if (IS_965(devid) && src_tiling != I915_TILING_NONE) {
+               src_pitch /= 4;
+               cmd_bits |= XY_SRC_COPY_BLT_SRC_TILED;
+       }
+
+       dst_pitch = width * 4;
+       if (IS_965(devid) && dst_tiling != I915_TILING_NONE) {
+               dst_pitch /= 4;
+               cmd_bits |= XY_SRC_COPY_BLT_DST_TILED;
+       }
+
+       BEGIN_BATCH(8);
+       OUT_BATCH(XY_SRC_COPY_BLT_CMD |
+                 XY_SRC_COPY_BLT_WRITE_ALPHA |
+                 XY_SRC_COPY_BLT_WRITE_RGB |
+                 cmd_bits);
+       OUT_BATCH((3 << 24) | /* 32 bits */
+                 (0xcc << 16) | /* copy ROP */
+                 dst_pitch);
+       OUT_BATCH(0); /* dst x1,y1 */
+       OUT_BATCH((height << 16) | width); /* dst x2,y2 */
+       OUT_RELOC(dst_bo, I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER, 0);
+       OUT_BATCH(0); /* src x1,y1 */
+       OUT_BATCH(src_pitch);
+       OUT_RELOC(src_bo, I915_GEM_DOMAIN_RENDER, 0, 0);
+       ADVANCE_BATCH();
+
+       intel_batchbuffer_flush(batch);
+}
+
+static drm_intel_bo *
+create_bo(void)
+{
+       drm_intel_bo *bo, *linear_bo;
+       uint32_t *linear;
+       uint32_t tiling = I915_TILING_X;
+       int ret, i;
+       int val = 0;
+
+       bo = drm_intel_bo_alloc(bufmgr, "tiled bo", size, 4096);
+       ret = drm_intel_bo_set_tiling(bo, &tiling, width * 4);
+       assert(ret == 0);
+       assert(tiling == I915_TILING_X);
+       linear_bo = drm_intel_bo_alloc(bufmgr, "linear src", size, 4096);
+
+       /* Fill the BO with dwords starting at start_val */
+       drm_intel_bo_map(linear_bo, 1);
+       linear = linear_bo->virtual;
+
+       for (i = 0; i < 1024 * 1024 / 4; i++)
+               linear[i] = val++;
+       drm_intel_bo_unmap(linear_bo);
+
+       copy_bo(bo, linear_bo);
+
+       drm_intel_bo_unreference(linear_bo);
+
+       return bo;
+}
+
+static int
+swizzle_bit(int bit, int offset)
+{
+       return (offset & (1 << bit)) >> (bit - 6);
+}
+
+/* Translate from a swizzled offset in the tiled buffer to the corresponding
+ * value from the original linear buffer.
+ */
+static uint32_t
+calculate_expected(int offset)
+{
+       int tile_off = offset & (PAGE_SIZE - 1);
+       int tile_base = offset - tile_off;
+       int tile_index = tile_base / PAGE_SIZE;
+       int tiles_per_row = width / (512 / 4); /* X tiled = 512b rows */
+
+       /* base x,y values from the tile (page) index. */
+       int base_y = tile_index / tiles_per_row * 8;
+       int base_x = tile_index % tiles_per_row * 128;
+
+       assert((offset % 4) == 0);
+       /* x, y offsets within the tile */
+       int tile_y = tile_off / 512;
+       int tile_x = (tile_off % 512) / 4;
+
+       /* printf("%3d, %3d, %3d,%3d\n", base_x, base_y, tile_x, tile_y); */
+       return (base_y + tile_y) * width + base_x + tile_x;
+}
+
+int
+main(int argc, char **argv)
+{
+       int fd;
+       drm_intel_bo *bo;
+       int i, iter = 100;
+       uint32_t buf[width * height];
+       uint32_t tiling, swizzle;
+
+       fd = drm_open_any();
+       intel_get_drm_devid(fd);
+
+       bufmgr = drm_intel_bufmgr_gem_init(fd, 4096);
+       drm_intel_bufmgr_gem_enable_reuse(bufmgr);
+       batch = intel_batchbuffer_alloc(bufmgr);
+
+       bo = create_bo();
+
+       drm_intel_bo_get_tiling(bo, &tiling, &swizzle);
+
+       /* Read a bunch of random subsets of the data and check that they come
+        * out right.
+        */
+       for (i = 0; i < iter; i++) {
+               int offset = (random() % size) & ~3;
+               int len = (random() % size) & ~3;
+               int j;
+
+               if (len == 0)
+                       len = 4;
+
+               if (offset + len > size)
+                       len = size - offset;
+
+               /* For sanity of reporting, make the first iteration be the
+                * whole buffer.
+                */
+               if (i == 0) {
+                       offset = 0;
+                       len = size;
+               }
+
+               drm_intel_bo_get_subdata(bo, offset, len, buf);
+
+               /* Translate from offsets in the read buffer to the swizzled
+                * address that it corresponds to.  This is the opposite of
+                * what Mesa does (calculate offset to be read given the linear
+                * offset it's looking for).
+                */
+               for (j = offset; j < offset + len; j += 4) {
+                       uint32_t expected_val, found_val;
+                       int swizzled_offset;
+
+                       switch (swizzle) {
+                       case I915_BIT_6_SWIZZLE_NONE:
+                               swizzled_offset = j;
+                               break;
+                       case I915_BIT_6_SWIZZLE_9:
+                               swizzled_offset = j ^
+                                       swizzle_bit(9, j);
+                               break;
+                       case I915_BIT_6_SWIZZLE_9_10:
+                               swizzled_offset = j ^
+                                       swizzle_bit(9, j) ^
+                                       swizzle_bit(10, j);
+                               break;
+                       case I915_BIT_6_SWIZZLE_9_11:
+                               swizzled_offset = j ^
+                                       swizzle_bit(9, j) ^
+                                       swizzle_bit(11, j);
+                               break;
+                       case I915_BIT_6_SWIZZLE_9_10_11:
+                               swizzled_offset = j ^
+                                       swizzle_bit(9, j) ^
+                                       swizzle_bit(10, j) ^
+                                       swizzle_bit(11, j);
+                               break;
+                       default:
+                               fprintf(stderr, "Bad swizzle bits; %d\n",
+                                       swizzle);
+                               abort();
+                       }
+                       expected_val = calculate_expected(swizzled_offset);
+                       found_val = buf[(j - offset) / 4];
+                       if (expected_val != found_val) {
+                               fprintf(stderr,
+                                       "Bad read: %d instead of %d at 0x%08x "
+                                       "for read from 0x%08x to 0x%08x\n",
+                                       found_val, expected_val, j,
+                                       offset, offset + len);
+                               abort();
+                       }
+               }
+       }
+
+       drm_intel_bo_unreference(bo);
+
+       intel_batchbuffer_free(batch);
+       drm_intel_bufmgr_destroy(bufmgr);
+
+       close(fd);
+
+       return 0;
+}