OSDN Git Service

ilo: enable bo reuse
[android-x86/external-mesa.git] / src / gallium / drivers / ilo / ilo_screen.c
index 731dc3d..82b98a0 100644 (file)
  */
 
 #include "util/u_format_s3tc.h"
+#include "vl/vl_decoder.h"
+#include "vl/vl_video_buffer.h"
 #include "intel_chipset.h"
+#include "intel_reg.h" /* for TIMESTAMP */
 #include "intel_winsys.h"
 
 #include "ilo_context.h"
 #include "ilo_public.h"
 #include "ilo_screen.h"
 
+int ilo_debug;
+
+static const struct debug_named_value ilo_debug_flags[] = {
+   { "3d",        ILO_DEBUG_3D,       "Dump 3D commands and states" },
+   { "vs",        ILO_DEBUG_VS,       "Dump vertex shaders" },
+   { "gs",        ILO_DEBUG_GS,       "Dump geometry shaders" },
+   { "fs",        ILO_DEBUG_FS,       "Dump fragment shaders" },
+   { "cs",        ILO_DEBUG_CS,       "Dump compute shaders" },
+   { "nohw",      ILO_DEBUG_NOHW,     "Do not send commands to HW" },
+   { "nocache",   ILO_DEBUG_NOCACHE,  "Always invalidate HW caches" },
+   DEBUG_NAMED_VALUE_END
+};
+
+static float
+ilo_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
+{
+   switch (param) {
+   case PIPE_CAPF_MAX_LINE_WIDTH:
+      /* in U3.7, defined in 3DSTATE_SF */
+      return 7.0f;
+   case PIPE_CAPF_MAX_LINE_WIDTH_AA:
+      /* line width minus one, which is reserved for AA region */
+      return 6.0f;
+   case PIPE_CAPF_MAX_POINT_WIDTH:
+      /* in U8.3, defined in 3DSTATE_SF */
+      return 255.0f;
+   case PIPE_CAPF_MAX_POINT_WIDTH_AA:
+      /* same as point width, as we ignore rasterizer->point_smooth */
+      return 255.0f;
+   case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
+      /* [2.0, 16.0], defined in SAMPLER_STATE */
+      return 16.0f;
+   case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
+      /* [-16.0, 16.0), defined in SAMPLER_STATE */
+      return 15.0f;
+   case PIPE_CAPF_GUARD_BAND_LEFT:
+   case PIPE_CAPF_GUARD_BAND_TOP:
+   case PIPE_CAPF_GUARD_BAND_RIGHT:
+   case PIPE_CAPF_GUARD_BAND_BOTTOM:
+      /* what are these for? */
+      return 0.0f;
+
+   default:
+      return 0.0f;
+   }
+}
+
+static int
+ilo_get_shader_param(struct pipe_screen *screen, unsigned shader,
+                     enum pipe_shader_cap param)
+{
+   switch (shader) {
+   case PIPE_SHADER_FRAGMENT:
+   case PIPE_SHADER_VERTEX:
+   case PIPE_SHADER_GEOMETRY:
+      break;
+   default:
+      return 0;
+   }
+
+   switch (param) {
+   /* the limits are copied from the classic driver */
+   case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
+      return (shader == PIPE_SHADER_FRAGMENT) ? 1024 : 16384;
+   case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
+      return (shader == PIPE_SHADER_FRAGMENT) ? 1024 : 0;
+   case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
+      return (shader == PIPE_SHADER_FRAGMENT) ? 1024 : 0;
+   case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
+      return (shader == PIPE_SHADER_FRAGMENT) ? 1024 : 0;
+   case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
+      return UINT_MAX;
+   case PIPE_SHADER_CAP_MAX_INPUTS:
+      /* this is limited by how many attributes SF can remap */
+      return 16;
+   case PIPE_SHADER_CAP_MAX_CONSTS:
+      return 1024;
+   case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
+      return ILO_MAX_CONST_BUFFERS;
+   case PIPE_SHADER_CAP_MAX_TEMPS:
+      return 256;
+   case PIPE_SHADER_CAP_MAX_ADDRS:
+      return (shader == PIPE_SHADER_FRAGMENT) ? 0 : 1;
+   case PIPE_SHADER_CAP_MAX_PREDS:
+      return 0;
+   case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
+      return 1;
+   case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
+      return 0;
+   case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
+      return 0;
+   case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
+      return (shader == PIPE_SHADER_FRAGMENT) ? 0 : 1;
+   case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
+      return 1;
+   case PIPE_SHADER_CAP_SUBROUTINES:
+      return 0;
+   case PIPE_SHADER_CAP_INTEGERS:
+      return 1;
+   case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
+      return ILO_MAX_SAMPLERS;
+   case PIPE_SHADER_CAP_PREFERRED_IR:
+      return PIPE_SHADER_IR_TGSI;
+   case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
+      return 1;
+
+   default:
+      return 0;
+   }
+}
+
+static int
+ilo_get_video_param(struct pipe_screen *screen,
+                    enum pipe_video_profile profile,
+                    enum pipe_video_cap param)
+{
+   switch (param) {
+   case PIPE_VIDEO_CAP_SUPPORTED:
+      return vl_profile_supported(screen, profile);
+   case PIPE_VIDEO_CAP_NPOT_TEXTURES:
+      return 1;
+   case PIPE_VIDEO_CAP_MAX_WIDTH:
+   case PIPE_VIDEO_CAP_MAX_HEIGHT:
+      return vl_video_buffer_max_size(screen);
+   case PIPE_VIDEO_CAP_PREFERED_FORMAT:
+      return PIPE_FORMAT_NV12;
+   case PIPE_VIDEO_CAP_PREFERS_INTERLACED:
+      return 1;
+   case PIPE_VIDEO_CAP_SUPPORTS_PROGRESSIVE:
+      return 1;
+   case PIPE_VIDEO_CAP_SUPPORTS_INTERLACED:
+      return 0;
+
+   default:
+      return 0;
+   }
+}
+
+static int
+ilo_get_compute_param(struct pipe_screen *screen,
+                      enum pipe_compute_cap param,
+                      void *ret)
+{
+   union {
+      const char *ir_target;
+      uint64_t grid_dimension;
+      uint64_t max_grid_size[3];
+      uint64_t max_block_size[3];
+      uint64_t max_threads_per_block;
+      uint64_t max_global_size;
+      uint64_t max_local_size;
+      uint64_t max_private_size;
+      uint64_t max_input_size;
+      uint64_t max_mem_alloc_size;
+   } val;
+   const void *ptr;
+   int size;
+
+   /* XXX some randomly chosen values */
+   switch (param) {
+   case PIPE_COMPUTE_CAP_IR_TARGET:
+      val.ir_target = "ilog";
+
+      ptr = val.ir_target;
+      size = strlen(val.ir_target) + 1;
+      break;
+   case PIPE_COMPUTE_CAP_GRID_DIMENSION:
+      val.grid_dimension = Elements(val.max_grid_size);
+
+      ptr = &val.grid_dimension;
+      size = sizeof(val.grid_dimension);
+      break;
+   case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:
+      val.max_grid_size[0] = 65535;
+      val.max_grid_size[1] = 65535;
+      val.max_grid_size[2] = 1;
+
+      ptr = &val.max_grid_size;
+      size = sizeof(val.max_grid_size);
+      break;
+   case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:
+      val.max_block_size[0] = 512;
+      val.max_block_size[1] = 512;
+      val.max_block_size[2] = 512;
+
+      ptr = &val.max_block_size;
+      size = sizeof(val.max_block_size);
+      break;
+
+   case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
+      val.max_threads_per_block = 512;
+
+      ptr = &val.max_threads_per_block;
+      size = sizeof(val.max_threads_per_block);
+      break;
+   case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE:
+      val.max_global_size = 4;
+
+      ptr = &val.max_global_size;
+      size = sizeof(val.max_global_size);
+      break;
+   case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:
+      val.max_local_size = 64 * 1024;
+
+      ptr = &val.max_local_size;
+      size = sizeof(val.max_local_size);
+      break;
+   case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE:
+      val.max_private_size = 32768;
+
+      ptr = &val.max_private_size;
+      size = sizeof(val.max_private_size);
+      break;
+   case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE:
+      val.max_input_size = 256;
+
+      ptr = &val.max_input_size;
+      size = sizeof(val.max_input_size);
+      break;
+   case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE:
+      val.max_mem_alloc_size = 128 * 1024 * 1024;
+
+      ptr = &val.max_mem_alloc_size;
+      size = sizeof(val.max_mem_alloc_size);
+      break;
+   default:
+      ptr = NULL;
+      size = 0;
+      break;
+   }
+
+   if (ret)
+      memcpy(ret, ptr, size);
+
+   return size;
+}
+
+static int
+ilo_get_param(struct pipe_screen *screen, enum pipe_cap param)
+{
+   struct ilo_screen *is = ilo_screen(screen);
+
+   switch (param) {
+   case PIPE_CAP_NPOT_TEXTURES:
+   case PIPE_CAP_TWO_SIDED_STENCIL:
+      return true;
+   case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
+      return 0; /* TODO */
+   case PIPE_CAP_ANISOTROPIC_FILTER:
+   case PIPE_CAP_POINT_SPRITE:
+      return true;
+   case PIPE_CAP_MAX_RENDER_TARGETS:
+      return ILO_MAX_DRAW_BUFFERS;
+   case PIPE_CAP_OCCLUSION_QUERY:
+   case PIPE_CAP_QUERY_TIME_ELAPSED:
+   case PIPE_CAP_TEXTURE_SHADOW_MAP:
+   case PIPE_CAP_TEXTURE_SWIZZLE: /* must be supported for shadow map */
+      return true;
+   case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
+      /*
+       * As defined in SURFACE_STATE, we have
+       *
+       *           Max WxHxD for 2D and CUBE     Max WxHxD for 3D
+       *  GEN6           8192x8192x512            2048x2048x2048
+       *  GEN7         16384x16384x2048           2048x2048x2048
+       *
+       * However, when the texutre size is large, things become unstable.  We
+       * require the maximum texture size to be 2^30 bytes in
+       * screen->can_create_resource().  Since the maximum pixel size is 2^4
+       * bytes (PIPE_FORMAT_R32G32B32A32_FLOAT), textures should not have more
+       * than 2^26 pixels.
+       *
+       * For 3D textures, we have to set the maximum number of levels to 9,
+       * which has at most 2^24 pixels.  For 2D textures, we set it to 14,
+       * which has at most 2^26 pixels.
+       */
+      return 14;
+   case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
+      return 9;
+   case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
+      return 14;
+   case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
+      return false;
+   case PIPE_CAP_BLEND_EQUATION_SEPARATE:
+   case PIPE_CAP_SM3:
+      return true;
+   case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
+      if (is->dev.gen >= ILO_GEN(7) && !is->dev.has_gen7_sol_reset)
+         return 0;
+      return ILO_MAX_SO_BUFFERS;
+   case PIPE_CAP_PRIMITIVE_RESTART:
+      return true;
+   case PIPE_CAP_MAX_COMBINED_SAMPLERS:
+      return ILO_MAX_SAMPLERS * 2;
+   case PIPE_CAP_INDEP_BLEND_ENABLE:
+   case PIPE_CAP_INDEP_BLEND_FUNC:
+      return true;
+   case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
+      return (is->dev.gen >= ILO_GEN(7)) ? 2048 : 512;
+   case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
+   case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
+   case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
+   case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
+   case PIPE_CAP_DEPTH_CLIP_DISABLE:
+      return true;
+   case PIPE_CAP_SHADER_STENCIL_EXPORT:
+      return false;
+   case PIPE_CAP_TGSI_INSTANCEID:
+   case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
+      return true;
+   case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
+      return false;
+   case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
+      return true;
+   case PIPE_CAP_SEAMLESS_CUBE_MAP:
+   case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
+   case PIPE_CAP_SCALED_RESOLVE:
+      return true;
+   case PIPE_CAP_MIN_TEXEL_OFFSET:
+      return -8;
+   case PIPE_CAP_MAX_TEXEL_OFFSET:
+      return 7;
+   case PIPE_CAP_CONDITIONAL_RENDER:
+   case PIPE_CAP_TEXTURE_BARRIER:
+      return true;
+   case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
+      return ILO_MAX_SO_BINDINGS / ILO_MAX_SO_BUFFERS;
+   case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
+      return ILO_MAX_SO_BINDINGS;
+   case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
+      if (is->dev.gen >= ILO_GEN(7))
+         return is->dev.has_gen7_sol_reset;
+      else
+         return false; /* TODO */
+   case PIPE_CAP_TGSI_CAN_COMPACT_VARYINGS:
+   case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
+      return false;
+   case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
+      return true;
+   case PIPE_CAP_VERTEX_COLOR_CLAMPED:
+      return false;
+   case PIPE_CAP_GLSL_FEATURE_LEVEL:
+      return 130;
+   case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
+   case PIPE_CAP_USER_VERTEX_BUFFERS:
+      return false;
+   case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
+   case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
+   case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
+      return false;
+   case PIPE_CAP_COMPUTE:
+      return false; /* TODO */
+   case PIPE_CAP_USER_INDEX_BUFFERS:
+      return false;
+   case PIPE_CAP_USER_CONSTANT_BUFFERS:
+      return false; /* TODO push constants */
+   case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
+      /* imposed by OWord (Dual) Block Read */
+      return 16;
+   case PIPE_CAP_START_INSTANCE:
+   case PIPE_CAP_QUERY_TIMESTAMP:
+      return true;
+   case PIPE_CAP_TEXTURE_MULTISAMPLE:
+      return false; /* TODO */
+   case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
+      return 0; /* TODO */
+   case PIPE_CAP_CUBE_MAP_ARRAY:
+      return false; /* TODO */
+   case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
+      return true;
+   case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
+      return 1;
+   case PIPE_CAP_TGSI_TEXCOORD:
+      return false;
+   case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
+      return true;
+   case PIPE_CAP_QUERY_PIPELINE_STATISTICS:
+      return false; /* TODO */
+   case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK:
+      return 0;
+   case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
+      /* a BRW_SURFACE_BUFFER can have up to 2^27 elements */
+      return 1 << 27;
+   case PIPE_CAP_MAX_VIEWPORTS:
+      return ILO_MAX_VIEWPORTS;
+
+   default:
+      return 0;
+   }
+}
+
+static const char *
+ilo_get_vendor(struct pipe_screen *screen)
+{
+   return "LunarG, Inc.";
+}
+
+static const char *
+ilo_get_name(struct pipe_screen *screen)
+{
+   struct ilo_screen *is = ilo_screen(screen);
+   const char *chipset;
+
+   /* stolen from classic i965 */
+   switch (is->dev.devid) {
+   case PCI_CHIP_SANDYBRIDGE_GT1:
+   case PCI_CHIP_SANDYBRIDGE_GT2:
+   case PCI_CHIP_SANDYBRIDGE_GT2_PLUS:
+      chipset = "Intel(R) Sandybridge Desktop";
+      break;
+   case PCI_CHIP_SANDYBRIDGE_M_GT1:
+   case PCI_CHIP_SANDYBRIDGE_M_GT2:
+   case PCI_CHIP_SANDYBRIDGE_M_GT2_PLUS:
+      chipset = "Intel(R) Sandybridge Mobile";
+      break;
+   case PCI_CHIP_SANDYBRIDGE_S:
+      chipset = "Intel(R) Sandybridge Server";
+      break;
+   case PCI_CHIP_IVYBRIDGE_GT1:
+   case PCI_CHIP_IVYBRIDGE_GT2:
+      chipset = "Intel(R) Ivybridge Desktop";
+      break;
+   case PCI_CHIP_IVYBRIDGE_M_GT1:
+   case PCI_CHIP_IVYBRIDGE_M_GT2:
+      chipset = "Intel(R) Ivybridge Mobile";
+      break;
+   case PCI_CHIP_IVYBRIDGE_S_GT1:
+   case PCI_CHIP_IVYBRIDGE_S_GT2:
+      chipset = "Intel(R) Ivybridge Server";
+      break;
+   case PCI_CHIP_BAYTRAIL_M_1:
+   case PCI_CHIP_BAYTRAIL_M_2:
+   case PCI_CHIP_BAYTRAIL_M_3:
+   case PCI_CHIP_BAYTRAIL_M_4:
+   case PCI_CHIP_BAYTRAIL_D:
+      chipset = "Intel(R) Bay Trail";
+      break;
+   case PCI_CHIP_HASWELL_GT1:
+   case PCI_CHIP_HASWELL_GT2:
+   case PCI_CHIP_HASWELL_GT3:
+   case PCI_CHIP_HASWELL_SDV_GT1:
+   case PCI_CHIP_HASWELL_SDV_GT2:
+   case PCI_CHIP_HASWELL_SDV_GT3:
+   case PCI_CHIP_HASWELL_ULT_GT1:
+   case PCI_CHIP_HASWELL_ULT_GT2:
+   case PCI_CHIP_HASWELL_ULT_GT3:
+   case PCI_CHIP_HASWELL_CRW_GT1:
+   case PCI_CHIP_HASWELL_CRW_GT2:
+   case PCI_CHIP_HASWELL_CRW_GT3:
+      chipset = "Intel(R) Haswell Desktop";
+      break;
+   case PCI_CHIP_HASWELL_M_GT1:
+   case PCI_CHIP_HASWELL_M_GT2:
+   case PCI_CHIP_HASWELL_M_GT3:
+   case PCI_CHIP_HASWELL_SDV_M_GT1:
+   case PCI_CHIP_HASWELL_SDV_M_GT2:
+   case PCI_CHIP_HASWELL_SDV_M_GT3:
+   case PCI_CHIP_HASWELL_ULT_M_GT1:
+   case PCI_CHIP_HASWELL_ULT_M_GT2:
+   case PCI_CHIP_HASWELL_ULT_M_GT3:
+   case PCI_CHIP_HASWELL_CRW_M_GT1:
+   case PCI_CHIP_HASWELL_CRW_M_GT2:
+   case PCI_CHIP_HASWELL_CRW_M_GT3:
+      chipset = "Intel(R) Haswell Mobile";
+      break;
+   case PCI_CHIP_HASWELL_S_GT1:
+   case PCI_CHIP_HASWELL_S_GT2:
+   case PCI_CHIP_HASWELL_S_GT3:
+   case PCI_CHIP_HASWELL_SDV_S_GT1:
+   case PCI_CHIP_HASWELL_SDV_S_GT2:
+   case PCI_CHIP_HASWELL_SDV_S_GT3:
+   case PCI_CHIP_HASWELL_ULT_S_GT1:
+   case PCI_CHIP_HASWELL_ULT_S_GT2:
+   case PCI_CHIP_HASWELL_ULT_S_GT3:
+   case PCI_CHIP_HASWELL_CRW_S_GT1:
+   case PCI_CHIP_HASWELL_CRW_S_GT2:
+   case PCI_CHIP_HASWELL_CRW_S_GT3:
+      chipset = "Intel(R) Haswell Server";
+      break;
+   default:
+      chipset = "Unknown Intel Chipset";
+      break;
+   }
+
+   return chipset;
+}
+
+static uint64_t
+ilo_get_timestamp(struct pipe_screen *screen)
+{
+   struct ilo_screen *is = ilo_screen(screen);
+   union {
+      uint64_t val;
+      uint32_t dw[2];
+   } timestamp;
+
+   is->winsys->read_reg(is->winsys, TIMESTAMP, &timestamp.val);
+
+   /*
+    * From the Ivy Bridge PRM, volume 1 part 3, page 107:
+    *
+    *     "Note: This timestamp register reflects the value of the PCU TSC.
+    *      The PCU TSC counts 10ns increments; this timestamp reflects bits
+    *      38:3 of the TSC (i.e. 80ns granularity, rolling over every 1.5
+    *      hours)."
+    *
+    * However, it seems dw[0] is garbage and dw[1] contains the lower 32 bits
+    * of the timestamp.  We will have to live with a timestamp that rolls over
+    * every ~343 seconds.
+    *
+    * See also brw_get_timestamp().
+    */
+   return (uint64_t) timestamp.dw[1] * 80;
+}
+
+static void
+ilo_fence_reference(struct pipe_screen *screen,
+                    struct pipe_fence_handle **p,
+                    struct pipe_fence_handle *f)
+{
+   struct ilo_fence **ptr = (struct ilo_fence **) p;
+   struct ilo_fence *fence = ilo_fence(f);
+
+   if (!ptr) {
+      /* still need to reference fence */
+      if (fence)
+         pipe_reference(NULL, &fence->reference);
+      return;
+   }
+
+   /* reference fence and dereference the one pointed to by ptr */
+   if (*ptr && pipe_reference(&(*ptr)->reference, &fence->reference)) {
+      struct ilo_fence *old = *ptr;
+
+      if (old->bo)
+         old->bo->unreference(old->bo);
+      FREE(old);
+   }
+
+   *ptr = fence;
+}
+
+static boolean
+ilo_fence_signalled(struct pipe_screen *screen,
+                    struct pipe_fence_handle *f)
+{
+   struct ilo_fence *fence = ilo_fence(f);
+
+   /* mark signalled if the bo is idle */
+   if (fence->bo && !intel_bo_is_busy(fence->bo)) {
+      fence->bo->unreference(fence->bo);
+      fence->bo = NULL;
+   }
+
+   return (fence->bo == NULL);
+}
+
+static boolean
+ilo_fence_finish(struct pipe_screen *screen,
+                 struct pipe_fence_handle *f,
+                 uint64_t timeout)
+{
+   struct ilo_fence *fence = ilo_fence(f);
+   const int64_t wait_timeout = (timeout > INT64_MAX) ? -1 : timeout;
+
+   /* already signalled */
+   if (!fence->bo)
+      return true;
+
+   /* wait and see if it returns error */
+   if (fence->bo->wait(fence->bo, wait_timeout))
+      return false;
+
+   /* mark signalled */
+   fence->bo->unreference(fence->bo);
+   fence->bo = NULL;
+
+   return true;
+}
+
 static void
 ilo_screen_destroy(struct pipe_screen *screen)
 {
@@ -46,53 +629,118 @@ ilo_screen_destroy(struct pipe_screen *screen)
    FREE(is);
 }
 
+static bool
+init_dev(struct ilo_dev_info *dev, const struct intel_winsys_info *info)
+{
+   dev->devid = info->devid;
+   dev->has_llc = info->has_llc;
+   dev->has_gen7_sol_reset = info->has_gen7_sol_reset;
+   dev->has_address_swizzling = info->has_address_swizzling;
+
+   /*
+    * From the Sandy Bridge PRM, volume 4 part 2, page 18:
+    *
+    *     "[DevSNB]: The GT1 product's URB provides 32KB of storage, arranged
+    *      as 1024 256-bit rows. The GT2 product's URB provides 64KB of
+    *      storage, arranged as 2048 256-bit rows. A row corresponds in size
+    *      to an EU GRF register. Read/write access to the URB is generally
+    *      supported on a row-granular basis."
+    *
+    * From the Ivy Bridge PRM, volume 4 part 2, page 17:
+    *
+    *     "URB Size    URB Rows    URB Rows when SLM Enabled
+    *      128k        4096        2048
+    *      256k        8096        4096"
+    */
+
+   if (IS_HASWELL(info->devid)) {
+      dev->gen = ILO_GEN(7.5);
+
+      if (IS_HSW_GT3(info->devid)) {
+         dev->gt = 3;
+         dev->urb_size = 512 * 1024;
+      }
+      else if (IS_HSW_GT2(info->devid)) {
+         dev->gt = 2;
+         dev->urb_size = 256 * 1024;
+      }
+      else {
+         dev->gt = 1;
+         dev->urb_size = 128 * 1024;
+      }
+   }
+   else if (IS_GEN7(info->devid)) {
+      dev->gen = ILO_GEN(7);
+
+      if (IS_IVB_GT2(info->devid)) {
+         dev->gt = 2;
+         dev->urb_size = 256 * 1024;
+      }
+      else {
+         dev->gt = 1;
+         dev->urb_size = 128 * 1024;
+      }
+   }
+   else if (IS_GEN6(info->devid)) {
+      dev->gen = ILO_GEN(6);
+
+      if (IS_SNB_GT2(info->devid)) {
+         dev->gt = 2;
+         dev->urb_size = 64 * 1024;
+      }
+      else {
+         dev->gt = 1;
+         dev->urb_size = 32 * 1024;
+      }
+   }
+   else {
+      ilo_err("unknown GPU generation\n");
+      return false;
+   }
+
+   return true;
+}
+
 struct pipe_screen *
 ilo_screen_create(struct intel_winsys *ws)
 {
    struct ilo_screen *is;
    const struct intel_winsys_info *info;
 
+   ilo_debug = debug_get_flags_option("ILO_DEBUG", ilo_debug_flags, 0);
+
    is = CALLOC_STRUCT(ilo_screen);
    if (!is)
       return NULL;
 
    is->winsys = ws;
 
-   info = is->winsys->get_info(is->winsys);
+   is->winsys->enable_reuse(is->winsys);
 
-   is->devid = info->devid;
-   if (IS_GEN7(info->devid)) {
-      is->gen = ILO_GEN(7);
-   }
-   else if (IS_GEN6(info->devid)) {
-      is->gen = ILO_GEN(6);
-   }
-   else {
-      ilo_err("unknown GPU generation\n");
+   info = is->winsys->get_info(is->winsys);
+   if (!init_dev(&is->dev, info)) {
       FREE(is);
       return NULL;
    }
 
-   is->has_llc = info->has_llc;
-
    util_format_s3tc_init();
 
    is->base.destroy = ilo_screen_destroy;
-   is->base.get_name = NULL;
-   is->base.get_vendor = NULL;
-   is->base.get_param = NULL;
-   is->base.get_paramf = NULL;
-   is->base.get_shader_param = NULL;
-   is->base.get_video_param = NULL;
-   is->base.get_compute_param = NULL;
+   is->base.get_name = ilo_get_name;
+   is->base.get_vendor = ilo_get_vendor;
+   is->base.get_param = ilo_get_param;
+   is->base.get_paramf = ilo_get_paramf;
+   is->base.get_shader_param = ilo_get_shader_param;
+   is->base.get_video_param = ilo_get_video_param;
+   is->base.get_compute_param = ilo_get_compute_param;
 
-   is->base.get_timestamp = NULL;
+   is->base.get_timestamp = ilo_get_timestamp;
 
    is->base.flush_frontbuffer = NULL;
 
-   is->base.fence_reference = NULL;
-   is->base.fence_signalled = NULL;
-   is->base.fence_finish = NULL;
+   is->base.fence_reference = ilo_fence_reference;
+   is->base.fence_signalled = ilo_fence_signalled;
+   is->base.fence_finish = ilo_fence_finish;
 
    is->base.get_driver_query_info = NULL;