vmwgfx: Make it possible to get fence from execbuf

[linux-2.6.git] / drivers / gpu / drm / vmwgfx / vmwgfx_execbuf.c
diff --git a/drivers/gpu/drm/vmwgfx/vmwgfx_execbuf.c b/drivers/gpu/drm/vmwgfx/vmwgfx_execbuf.c

index cc8c08b35102d3c00101119d4ae19d5a58dfcb9f..4acced44a623428a0ee60d2973763f81d126b36b 100644 (file)
--- a/drivers/gpu/drm/vmwgfx/vmwgfx_execbuf.c
+++ b/drivers/gpu/drm/vmwgfx/vmwgfx_execbuf.c
@@ -44,28 +44,63 @@ static int vmw_cmd_ok(struct vmw_private *dev_priv,
         return 0;
  }
  
-
-static int vmw_resource_to_validate_list(struct vmw_sw_context *sw_context,
-                                        struct vmw_resource **p_res)
+static void vmw_resource_to_validate_list(struct vmw_sw_context *sw_context,
+                                         struct vmw_resource **p_res)
  {
-       int ret = 0;
         struct vmw_resource *res = *p_res;
  
-       if (!res->on_validate_list) {
-               if (sw_context->num_ref_resources >= VMWGFX_MAX_VALIDATIONS) {
-                       DRM_ERROR("Too many resources referenced in "
-                                 "command stream.\n");
-                       ret = -ENOMEM;
-                       goto out;
-               }
-               sw_context->resources[sw_context->num_ref_resources++] = res;
-               res->on_validate_list = true;
-               return 0;
+       if (list_empty(&res->validate_head)) {
+               list_add_tail(&res->validate_head, &sw_context->resource_list);
+               *p_res = NULL;
+       } else
+               vmw_resource_unreference(p_res);
+}
+
+/**
+ * vmw_bo_to_validate_list - add a bo to a validate list
+ *
+ * @sw_context: The software context used for this command submission batch.
+ * @bo: The buffer object to add.
+ * @fence_flags: Fence flags to be or'ed with any other fence flags for
+ * this buffer on this submission batch.
+ * @p_val_node: If non-NULL Will be updated with the validate node number
+ * on return.
+ *
+ * Returns -EINVAL if the limit of number of buffer objects per command
+ * submission is reached.
+ */
+static int vmw_bo_to_validate_list(struct vmw_sw_context *sw_context,
+                                  struct ttm_buffer_object *bo,
+                                  uint32_t fence_flags,
+                                  uint32_t *p_val_node)
+{
+       uint32_t val_node;
+       struct ttm_validate_buffer *val_buf;
+
+       val_node = vmw_dmabuf_validate_node(bo, sw_context->cur_val_buf);
+
+       if (unlikely(val_node >= VMWGFX_MAX_VALIDATIONS)) {
+               DRM_ERROR("Max number of DMA buffers per submission"
+                         " exceeded.\n");
+               return -EINVAL;
         }
  
-out:
-       vmw_resource_unreference(p_res);
-       return ret;
+       val_buf = &sw_context->val_bufs[val_node];
+       if (unlikely(val_node == sw_context->cur_val_buf)) {
+               val_buf->new_sync_obj_arg = NULL;
+               val_buf->bo = ttm_bo_reference(bo);
+               list_add_tail(&val_buf->head, &sw_context->validate_nodes);
+               ++sw_context->cur_val_buf;
+       }
+
+       val_buf->new_sync_obj_arg = (void *)
+               ((unsigned long) val_buf->new_sync_obj_arg | fence_flags);
+       sw_context->fence_flags |= fence_flags;
+
+       if (p_val_node)
+               *p_val_node = val_node;
+
+       return 0;
  }
  
  static int vmw_cmd_cid_check(struct vmw_private *dev_priv,
@@ -94,7 +129,10 @@ static int vmw_cmd_cid_check(struct vmw_private *dev_priv,
  
         sw_context->last_cid = cmd->cid;
         sw_context->cid_valid = true;
-       return vmw_resource_to_validate_list(sw_context, &ctx);
+       sw_context->cur_ctx = ctx;
+       vmw_resource_to_validate_list(sw_context, &ctx);
+
+       return 0;
  }
  
  static int vmw_cmd_sid_check(struct vmw_private *dev_priv,
@@ -114,7 +152,8 @@ static int vmw_cmd_sid_check(struct vmw_private *dev_priv,
                 return 0;
         }
  
-       ret = vmw_user_surface_lookup_handle(dev_priv, sw_context->tfile,
+       ret = vmw_user_surface_lookup_handle(dev_priv,
+                                            sw_context->tfile,
                                              *sid, &srf);
         if (unlikely(ret != 0)) {
                 DRM_ERROR("Could ot find or use surface 0x%08x "
@@ -124,13 +163,23 @@ static int vmw_cmd_sid_check(struct vmw_private *dev_priv,
                 return ret;
         }
  
+       ret = vmw_surface_validate(dev_priv, srf);
+       if (unlikely(ret != 0)) {
+               if (ret != -ERESTARTSYS)
+                       DRM_ERROR("Could not validate surface.\n");
+               vmw_surface_unreference(&srf);
+               return ret;
+       }
+
         sw_context->last_sid = *sid;
         sw_context->sid_valid = true;
         sw_context->sid_translation = srf->res.id;
         *sid = sw_context->sid_translation;
  
         res = &srf->res;
-       return vmw_resource_to_validate_list(sw_context, &res);
+       vmw_resource_to_validate_list(sw_context, &res);
+
+       return 0;
  }
  
  
@@ -197,6 +246,12 @@ static int vmw_cmd_blt_surf_screen_check(struct vmw_private *dev_priv,
         } *cmd;
  
         cmd = container_of(header, struct vmw_sid_cmd, header);
+
+       if (unlikely(!sw_context->kernel)) {
+               DRM_ERROR("Kernel only SVGA3d command: %u.\n", cmd->header.id);
+               return -EPERM;
+       }
+
         return vmw_cmd_sid_check(dev_priv, sw_context, &cmd->body.srcImage.sid);
  }
  
@@ -209,10 +264,179 @@ static int vmw_cmd_present_check(struct vmw_private *dev_priv,
                 SVGA3dCmdPresent body;
         } *cmd;
  
+
         cmd = container_of(header, struct vmw_sid_cmd, header);
+
+       if (unlikely(!sw_context->kernel)) {
+               DRM_ERROR("Kernel only SVGA3d command: %u.\n", cmd->header.id);
+               return -EPERM;
+       }
+
         return vmw_cmd_sid_check(dev_priv, sw_context, &cmd->body.sid);
  }
  
+/**
+ * vmw_query_bo_switch_prepare - Prepare to switch pinned buffer for queries.
+ *
+ * @dev_priv: The device private structure.
+ * @cid: The hardware context for the next query.
+ * @new_query_bo: The new buffer holding query results.
+ * @sw_context: The software context used for this command submission.
+ *
+ * This function checks whether @new_query_bo is suitable for holding
+ * query results, and if another buffer currently is pinned for query
+ * results. If so, the function prepares the state of @sw_context for
+ * switching pinned buffers after successful submission of the current
+ * command batch. It also checks whether we're using a new query context.
+ * In that case, it makes sure we emit a query barrier for the old
+ * context before the current query buffer is fenced.
+ */
+static int vmw_query_bo_switch_prepare(struct vmw_private *dev_priv,
+                                      uint32_t cid,
+                                      struct ttm_buffer_object *new_query_bo,
+                                      struct vmw_sw_context *sw_context)
+{
+       int ret;
+       bool add_cid = false;
+       uint32_t cid_to_add;
+
+       if (unlikely(new_query_bo != sw_context->cur_query_bo)) {
+
+               if (unlikely(new_query_bo->num_pages > 4)) {
+                       DRM_ERROR("Query buffer too large.\n");
+                       return -EINVAL;
+               }
+
+               if (unlikely(sw_context->cur_query_bo != NULL)) {
+                       BUG_ON(!sw_context->query_cid_valid);
+                       add_cid = true;
+                       cid_to_add = sw_context->cur_query_cid;
+                       ret = vmw_bo_to_validate_list(sw_context,
+                                                     sw_context->cur_query_bo,
+                                                     DRM_VMW_FENCE_FLAG_EXEC,
+                                                     NULL);
+                       if (unlikely(ret != 0))
+                               return ret;
+               }
+               sw_context->cur_query_bo = new_query_bo;
+
+               ret = vmw_bo_to_validate_list(sw_context,
+                                             dev_priv->dummy_query_bo,
+                                             DRM_VMW_FENCE_FLAG_EXEC,
+                                             NULL);
+               if (unlikely(ret != 0))
+                       return ret;
+
+       }
+
+       if (unlikely(cid != sw_context->cur_query_cid &&
+                    sw_context->query_cid_valid)) {
+               add_cid = true;
+               cid_to_add = sw_context->cur_query_cid;
+       }
+
+       sw_context->cur_query_cid = cid;
+       sw_context->query_cid_valid = true;
+
+       if (add_cid) {
+               struct vmw_resource *ctx = sw_context->cur_ctx;
+
+               if (list_empty(&ctx->query_head))
+                       list_add_tail(&ctx->query_head,
+                                     &sw_context->query_list);
+               ret = vmw_bo_to_validate_list(sw_context,
+                                             dev_priv->dummy_query_bo,
+                                             DRM_VMW_FENCE_FLAG_EXEC,
+                                             NULL);
+               if (unlikely(ret != 0))
+                       return ret;
+       }
+       return 0;
+}
+
+
+/**
+ * vmw_query_bo_switch_commit - Finalize switching pinned query buffer
+ *
+ * @dev_priv: The device private structure.
+ * @sw_context: The software context used for this command submission batch.
+ *
+ * This function will check if we're switching query buffers, and will then,
+ * if no other query waits are issued this command submission batch,
+ * issue a dummy occlusion query wait used as a query barrier. When the fence
+ * object following that query wait has signaled, we are sure that all
+ * preseding queries have finished, and the old query buffer can be unpinned.
+ * However, since both the new query buffer and the old one are fenced with
+ * that fence, we can do an asynchronus unpin now, and be sure that the
+ * old query buffer won't be moved until the fence has signaled.
+ *
+ * As mentioned above, both the new - and old query buffers need to be fenced
+ * using a sequence emitted *after* calling this function.
+ */
+static void vmw_query_bo_switch_commit(struct vmw_private *dev_priv,
+                                    struct vmw_sw_context *sw_context)
+{
+
+       struct vmw_resource *ctx, *next_ctx;
+       int ret;
+
+       /*
+        * The validate list should still hold references to all
+        * contexts here.
+        */
+
+       list_for_each_entry_safe(ctx, next_ctx, &sw_context->query_list,
+                                query_head) {
+               list_del_init(&ctx->query_head);
+
+               BUG_ON(list_empty(&ctx->validate_head));
+
+               ret = vmw_fifo_emit_dummy_query(dev_priv, ctx->id);
+
+               if (unlikely(ret != 0))
+                       DRM_ERROR("Out of fifo space for dummy query.\n");
+       }
+
+       if (dev_priv->pinned_bo != sw_context->cur_query_bo) {
+               if (dev_priv->pinned_bo) {
+                       vmw_bo_pin(dev_priv->pinned_bo, false);
+                       ttm_bo_unref(&dev_priv->pinned_bo);
+               }
+
+               vmw_bo_pin(sw_context->cur_query_bo, true);
+
+               /*
+                * We pin also the dummy_query_bo buffer so that we
+                * don't need to validate it when emitting
+                * dummy queries in context destroy paths.
+                */
+
+               vmw_bo_pin(dev_priv->dummy_query_bo, true);
+               dev_priv->dummy_query_bo_pinned = true;
+
+               dev_priv->query_cid = sw_context->cur_query_cid;
+               dev_priv->pinned_bo =
+                       ttm_bo_reference(sw_context->cur_query_bo);
+       }
+}
+
+/**
+ * vmw_query_switch_backoff - clear query barrier list
+ * @sw_context: The sw context used for this submission batch.
+ *
+ * This function is used as part of an error path, where a previously
+ * set up list of query barriers needs to be cleared.
+ *
+ */
+static void vmw_query_switch_backoff(struct vmw_sw_context *sw_context)
+{
+       struct list_head *list, *next;
+
+       list_for_each_safe(list, next, &sw_context->query_list) {
+               list_del_init(list);
+       }
+}
+
  static int vmw_translate_guest_ptr(struct vmw_private *dev_priv,
                                    struct vmw_sw_context *sw_context,
                                    SVGAGuestPtr *ptr,
@@ -222,8 +446,6 @@ static int vmw_translate_guest_ptr(struct vmw_private *dev_priv,
         struct ttm_buffer_object *bo;
         uint32_t handle = ptr->gmrId;
         struct vmw_relocation *reloc;
-       uint32_t cur_validate_node;
-       struct ttm_validate_buffer *val_buf;
         int ret;
  
         ret = vmw_user_dmabuf_lookup(sw_context->tfile, handle, &vmw_bo);
@@ -243,23 +465,11 @@ static int vmw_translate_guest_ptr(struct vmw_private *dev_priv,
         reloc = &sw_context->relocs[sw_context->cur_reloc++];
         reloc->location = ptr;
  
-       cur_validate_node = vmw_dmabuf_validate_node(bo, sw_context->cur_val_buf);
-       if (unlikely(cur_validate_node >= VMWGFX_MAX_VALIDATIONS)) {
-               DRM_ERROR("Max number of DMA buffers per submission"
-                         " exceeded.\n");
-               ret = -EINVAL;
+       ret = vmw_bo_to_validate_list(sw_context, bo, DRM_VMW_FENCE_FLAG_EXEC,
+                                     &reloc->index);
+       if (unlikely(ret != 0))
                 goto out_no_reloc;
-       }
  
-       reloc->index = cur_validate_node;
-       if (unlikely(cur_validate_node == sw_context->cur_val_buf)) {
-               val_buf = &sw_context->val_bufs[cur_validate_node];
-               val_buf->bo = ttm_bo_reference(bo);
-               val_buf->usage = TTM_USAGE_READWRITE;
-               val_buf->new_sync_obj_arg = (void *) DRM_VMW_FENCE_FLAG_EXEC;
-               list_add_tail(&val_buf->head, &sw_context->validate_nodes);
-               ++sw_context->cur_val_buf;
-       }
         *vmw_bo_p = vmw_bo;
         return 0;
  
@@ -291,8 +501,11 @@ static int vmw_cmd_end_query(struct vmw_private *dev_priv,
         if (unlikely(ret != 0))
                 return ret;
  
+       ret = vmw_query_bo_switch_prepare(dev_priv, cmd->q.cid,
+                                         &vmw_bo->base, sw_context);
+
         vmw_dmabuf_unreference(&vmw_bo);
-       return 0;
+       return ret;
  }
  
  static int vmw_cmd_wait_query(struct vmw_private *dev_priv,
@@ -305,6 +518,7 @@ static int vmw_cmd_wait_query(struct vmw_private *dev_priv,
                 SVGA3dCmdWaitForQuery q;
         } *cmd;
         int ret;
+       struct vmw_resource *ctx;
  
         cmd = container_of(header, struct vmw_query_cmd, header);
         ret = vmw_cmd_cid_check(dev_priv, sw_context, header);
@@ -318,6 +532,16 @@ static int vmw_cmd_wait_query(struct vmw_private *dev_priv,
                 return ret;
  
         vmw_dmabuf_unreference(&vmw_bo);
+
+       /*
+        * This wait will act as a barrier for previous waits for this
+        * context.
+        */
+
+       ctx = sw_context->cur_ctx;
+       if (!list_empty(&ctx->query_head))
+               list_del_init(&ctx->query_head);
+
         return 0;
  }
  
@@ -350,6 +574,13 @@ static int vmw_cmd_dma(struct vmw_private *dev_priv,
                 goto out_no_reloc;
         }
  
+       ret = vmw_surface_validate(dev_priv, srf);
+       if (unlikely(ret != 0)) {
+               if (ret != -ERESTARTSYS)
+                       DRM_ERROR("Culd not validate surface.\n");
+               goto out_no_validate;
+       }
+
         /*
          * Patch command stream with device SID.
          */
@@ -359,8 +590,12 @@ static int vmw_cmd_dma(struct vmw_private *dev_priv,
         vmw_dmabuf_unreference(&vmw_bo);
  
         res = &srf->res;
-       return vmw_resource_to_validate_list(sw_context, &res);
+       vmw_resource_to_validate_list(sw_context, &res);
  
+       return 0;
+
+out_no_validate:
+       vmw_surface_unreference(&srf);
  out_no_reloc:
         vmw_dmabuf_unreference(&vmw_bo);
         return ret;
@@ -450,6 +685,71 @@ static int vmw_cmd_tex_state(struct vmw_private *dev_priv,
         return 0;
  }
  
+static int vmw_cmd_check_define_gmrfb(struct vmw_private *dev_priv,
+                                     struct vmw_sw_context *sw_context,
+                                     void *buf)
+{
+       struct vmw_dma_buffer *vmw_bo;
+       int ret;
+
+       struct {
+               uint32_t header;
+               SVGAFifoCmdDefineGMRFB body;
+       } *cmd = buf;
+
+       ret = vmw_translate_guest_ptr(dev_priv, sw_context,
+                                     &cmd->body.ptr,
+                                     &vmw_bo);
+       if (unlikely(ret != 0))
+               return ret;
+
+       vmw_dmabuf_unreference(&vmw_bo);
+
+       return ret;
+}
+
+static int vmw_cmd_check_not_3d(struct vmw_private *dev_priv,
+                               struct vmw_sw_context *sw_context,
+                               void *buf, uint32_t *size)
+{
+       uint32_t size_remaining = *size;
+       uint32_t cmd_id;
+
+       cmd_id = le32_to_cpu(((uint32_t *)buf)[0]);
+       switch (cmd_id) {
+       case SVGA_CMD_UPDATE:
+               *size = sizeof(uint32_t) + sizeof(SVGAFifoCmdUpdate);
+               break;
+       case SVGA_CMD_DEFINE_GMRFB:
+               *size = sizeof(uint32_t) + sizeof(SVGAFifoCmdDefineGMRFB);
+               break;
+       case SVGA_CMD_BLIT_GMRFB_TO_SCREEN:
+               *size = sizeof(uint32_t) + sizeof(SVGAFifoCmdBlitGMRFBToScreen);
+               break;
+       case SVGA_CMD_BLIT_SCREEN_TO_GMRFB:
+               *size = sizeof(uint32_t) + sizeof(SVGAFifoCmdBlitGMRFBToScreen);
+               break;
+       default:
+               DRM_ERROR("Unsupported SVGA command: %u.\n", cmd_id);
+               return -EINVAL;
+       }
+
+       if (*size > size_remaining) {
+               DRM_ERROR("Invalid SVGA command (size mismatch):"
+                         " %u.\n", cmd_id);
+               return -EINVAL;
+       }
+
+       if (unlikely(!sw_context->kernel)) {
+               DRM_ERROR("Kernel only SVGA command: %u.\n", cmd_id);
+               return -EPERM;
+       }
+
+       if (cmd_id == SVGA_CMD_DEFINE_GMRFB)
+               return vmw_cmd_check_define_gmrfb(dev_priv, sw_context, buf);
+
+       return 0;
+}
  
  typedef int (*vmw_cmd_func) (struct vmw_private *,
                              struct vmw_sw_context *,
@@ -502,11 +802,11 @@ static int vmw_cmd_check(struct vmw_private *dev_priv,
         SVGA3dCmdHeader *header = (SVGA3dCmdHeader *) buf;
         int ret;
  
-       cmd_id = ((uint32_t *)buf)[0];
-       if (cmd_id == SVGA_CMD_UPDATE) {
-               *size = 5 << 2;
-               return 0;
-       }
+       cmd_id = le32_to_cpu(((uint32_t *)buf)[0]);
+       /* Handle any none 3D commands */
+       if (unlikely(cmd_id < SVGA_CMD_MAX))
+               return vmw_cmd_check_not_3d(dev_priv, sw_context, buf, size);
+
  
         cmd_id = le32_to_cpu(header->id);
         *size = le32_to_cpu(header->size) + sizeof(SVGA3dCmdHeader);
@@ -531,9 +831,9 @@ out_err:
  
  static int vmw_cmd_check_all(struct vmw_private *dev_priv,
                              struct vmw_sw_context *sw_context,
+                            void *buf,
                              uint32_t size)
  {
-       void *buf = sw_context->cmd_bounce;
         int32_t cur_size = size;
         int ret;
  
@@ -582,7 +882,7 @@ static void vmw_apply_relocations(struct vmw_sw_context *sw_context)
  static void vmw_clear_validations(struct vmw_sw_context *sw_context)
  {
         struct ttm_validate_buffer *entry, *next;
-       uint32_t i = sw_context->num_ref_resources;
+       struct vmw_resource *res, *res_next;
  
         /*
          * Drop references to DMA buffers held during command submission.
@@ -599,9 +899,11 @@ static void vmw_clear_validations(struct vmw_sw_context *sw_context)
         /*
          * Drop references to resources held during command submission.
          */
-       while (i-- > 0) {
-               sw_context->resources[i]->on_validate_list = false;
-               vmw_resource_unreference(&sw_context->resources[i]);
+       vmw_resource_unreserve(&sw_context->resource_list);
+       list_for_each_entry_safe(res, res_next, &sw_context->resource_list,
+                                validate_head) {
+               list_del_init(&res->validate_head);
+               vmw_resource_unreference(&res);
         }
  }
  
@@ -610,6 +912,16 @@ static int vmw_validate_single_buffer(struct vmw_private *dev_priv,
  {
         int ret;
  
+
+       /*
+        * Don't validate pinned buffers.
+        */
+
+       if (bo == dev_priv->pinned_bo ||
+           (bo == dev_priv->dummy_query_bo &&
+            dev_priv->dummy_query_bo_pinned))
+               return 0;
+
         /**
          * Put BO in VRAM if there is space, otherwise as a GMR.
          * If there is no space in VRAM and GMR ids are all used up,
@@ -724,69 +1036,128 @@ int vmw_execbuf_fence_commands(struct drm_file *file_priv,
         return 0;
  }
  
-int vmw_execbuf_ioctl(struct drm_device *dev, void *data,
-                     struct drm_file *file_priv)
+/**
+ * vmw_execbuf_copy_fence_user - copy fence object information to
+ * user-space.
+ *
+ * @dev_priv: Pointer to a vmw_private struct.
+ * @vmw_fp: Pointer to the struct vmw_fpriv representing the calling file.
+ * @ret: Return value from fence object creation.
+ * @user_fence_rep: User space address of a struct drm_vmw_fence_rep to
+ * which the information should be copied.
+ * @fence: Pointer to the fenc object.
+ * @fence_handle: User-space fence handle.
+ *
+ * This function copies fence information to user-space. If copying fails,
+ * The user-space struct drm_vmw_fence_rep::error member is hopefully
+ * left untouched, and if it's preloaded with an -EFAULT by user-space,
+ * the error will hopefully be detected.
+ * Also if copying fails, user-space will be unable to signal the fence
+ * object so we wait for it immediately, and then unreference the
+ * user-space reference.
+ */
+void
+vmw_execbuf_copy_fence_user(struct vmw_private *dev_priv,
+                           struct vmw_fpriv *vmw_fp,
+                           int ret,
+                           struct drm_vmw_fence_rep __user *user_fence_rep,
+                           struct vmw_fence_obj *fence,
+                           uint32_t fence_handle)
  {
-       struct vmw_private *dev_priv = vmw_priv(dev);
-       struct drm_vmw_execbuf_arg *arg = (struct drm_vmw_execbuf_arg *)data;
         struct drm_vmw_fence_rep fence_rep;
-       struct drm_vmw_fence_rep __user *user_fence_rep;
-       int ret;
-       void *user_cmd;
-       void *cmd;
-       struct vmw_sw_context *sw_context = &dev_priv->ctx;
-       struct vmw_master *vmaster = vmw_master(file_priv->master);
-       struct vmw_fence_obj *fence;
-       uint32_t handle;
+
+       if (user_fence_rep == NULL)
+               return;
+
+       memset(&fence_rep, 0, sizeof(fence_rep));
+
+       fence_rep.error = ret;
+       if (ret == 0) {
+               BUG_ON(fence == NULL);
+
+               fence_rep.handle = fence_handle;
+               fence_rep.seqno = fence->seqno;
+               vmw_update_seqno(dev_priv, &dev_priv->fifo);
+               fence_rep.passed_seqno = dev_priv->last_read_seqno;
+       }
  
         /*
-        * This will allow us to extend the ioctl argument while
-        * maintaining backwards compatibility:
-        * We take different code paths depending on the value of
-        * arg->version.
+        * copy_to_user errors will be detected by user space not
+        * seeing fence_rep::error filled in. Typically
+        * user-space would have pre-set that member to -EFAULT.
          */
+       ret = copy_to_user(user_fence_rep, &fence_rep,
+                          sizeof(fence_rep));
  
-       if (unlikely(arg->version != DRM_VMW_EXECBUF_VERSION)) {
-               DRM_ERROR("Incorrect execbuf version.\n");
-               DRM_ERROR("You're running outdated experimental "
-                         "vmwgfx user-space drivers.");
-               return -EINVAL;
+       /*
+        * User-space lost the fence object. We need to sync
+        * and unreference the handle.
+        */
+       if (unlikely(ret != 0) && (fence_rep.error == 0)) {
+               ttm_ref_object_base_unref(vmw_fp->tfile,
+                                         fence_handle, TTM_REF_USAGE);
+               DRM_ERROR("Fence copy error. Syncing.\n");
+               (void) vmw_fence_obj_wait(fence, fence->signal_mask,
+                                         false, false,
+                                         VMW_FENCE_WAIT_TIMEOUT);
         }
+}
  
-       ret = ttm_read_lock(&vmaster->lock, true);
-       if (unlikely(ret != 0))
-               return ret;
+int vmw_execbuf_process(struct drm_file *file_priv,
+                       struct vmw_private *dev_priv,
+                       void __user *user_commands,
+                       void *kernel_commands,
+                       uint32_t command_size,
+                       uint64_t throttle_us,
+                       struct drm_vmw_fence_rep __user *user_fence_rep,
+                       struct vmw_fence_obj **out_fence)
+{
+       struct vmw_sw_context *sw_context = &dev_priv->ctx;
+       struct vmw_fence_obj *fence = NULL;
+       uint32_t handle;
+       void *cmd;
+       int ret;
  
         ret = mutex_lock_interruptible(&dev_priv->cmdbuf_mutex);
-       if (unlikely(ret != 0)) {
-               ret = -ERESTARTSYS;
-               goto out_no_cmd_mutex;
-       }
-
-       ret = vmw_resize_cmd_bounce(sw_context, arg->command_size);
         if (unlikely(ret != 0))
-               goto out_unlock;
+               return -ERESTARTSYS;
  
-       user_cmd = (void __user *)(unsigned long)arg->commands;
-       ret = copy_from_user(sw_context->cmd_bounce,
-                            user_cmd, arg->command_size);
+       if (kernel_commands == NULL) {
+               sw_context->kernel = false;
  
-       if (unlikely(ret != 0)) {
-               ret = -EFAULT;
-               DRM_ERROR("Failed copying commands.\n");
-               goto out_unlock;
-       }
+               ret = vmw_resize_cmd_bounce(sw_context, command_size);
+               if (unlikely(ret != 0))
+                       goto out_unlock;
+
+
+               ret = copy_from_user(sw_context->cmd_bounce,
+                                    user_commands, command_size);
+
+               if (unlikely(ret != 0)) {
+                       ret = -EFAULT;
+                       DRM_ERROR("Failed copying commands.\n");
+                       goto out_unlock;
+               }
+               kernel_commands = sw_context->cmd_bounce;
+       } else
+               sw_context->kernel = true;
  
         sw_context->tfile = vmw_fpriv(file_priv)->tfile;
         sw_context->cid_valid = false;
         sw_context->sid_valid = false;
         sw_context->cur_reloc = 0;
         sw_context->cur_val_buf = 0;
-       sw_context->num_ref_resources = 0;
+       sw_context->fence_flags = 0;
+       INIT_LIST_HEAD(&sw_context->query_list);
+       INIT_LIST_HEAD(&sw_context->resource_list);
+       sw_context->cur_query_bo = dev_priv->pinned_bo;
+       sw_context->cur_query_cid = dev_priv->query_cid;
+       sw_context->query_cid_valid = (dev_priv->pinned_bo != NULL);
  
         INIT_LIST_HEAD(&sw_context->validate_nodes);
  
-       ret = vmw_cmd_check_all(dev_priv, sw_context, arg->command_size);
+       ret = vmw_cmd_check_all(dev_priv, sw_context, kernel_commands,
+                               command_size);
         if (unlikely(ret != 0))
                 goto out_err;
  
@@ -800,26 +1171,25 @@ int vmw_execbuf_ioctl(struct drm_device *dev, void *data,
  
         vmw_apply_relocations(sw_context);
  
-       if (arg->throttle_us) {
+       if (throttle_us) {
                 ret = vmw_wait_lag(dev_priv, &dev_priv->fifo.marker_queue,
-                                  arg->throttle_us);
+                                  throttle_us);
  
                 if (unlikely(ret != 0))
                         goto out_throttle;
         }
  
-       cmd = vmw_fifo_reserve(dev_priv, arg->command_size);
+       cmd = vmw_fifo_reserve(dev_priv, command_size);
         if (unlikely(cmd == NULL)) {
                 DRM_ERROR("Failed reserving fifo space for commands.\n");
                 ret = -ENOMEM;
-               goto out_err;
+               goto out_throttle;
         }
  
-       memcpy(cmd, sw_context->cmd_bounce, arg->command_size);
-       vmw_fifo_commit(dev_priv, arg->command_size);
+       memcpy(cmd, kernel_commands, command_size);
+       vmw_fifo_commit(dev_priv, command_size);
  
-       user_fence_rep = (struct drm_vmw_fence_rep __user *)
-               (unsigned long)arg->fence_rep;
+       vmw_query_bo_switch_commit(dev_priv, sw_context);
         ret = vmw_execbuf_fence_commands(file_priv, dev_priv,
                                          &fence,
                                          (user_fence_rep) ? &handle : NULL);
@@ -836,54 +1206,177 @@ int vmw_execbuf_ioctl(struct drm_device *dev, void *data,
                                     (void *) fence);
  
         vmw_clear_validations(sw_context);
-       mutex_unlock(&dev_priv->cmdbuf_mutex);
-
-       if (user_fence_rep) {
-               fence_rep.error = ret;
-               fence_rep.handle = handle;
-               fence_rep.seqno = fence->seqno;
-               vmw_update_seqno(dev_priv, &dev_priv->fifo);
-               fence_rep.passed_seqno = dev_priv->last_read_seqno;
-
-               /*
-                * copy_to_user errors will be detected by user space not
-                * seeing fence_rep::error filled in. Typically
-                * user-space would have pre-set that member to -EFAULT.
-                */
-               ret = copy_to_user(user_fence_rep, &fence_rep,
-                                  sizeof(fence_rep));
-
-               /*
-                * User-space lost the fence object. We need to sync
-                * and unreference the handle.
-                */
-               if (unlikely(ret != 0) && (fence_rep.error == 0)) {
-                       BUG_ON(fence == NULL);
-
-                       ttm_ref_object_base_unref(vmw_fpriv(file_priv)->tfile,
-                                                 handle, TTM_REF_USAGE);
-                       DRM_ERROR("Fence copy error. Syncing.\n");
-                       (void) vmw_fence_obj_wait(fence,
-                                                 fence->signal_mask,
-                                                 false, false,
-                                                 VMW_FENCE_WAIT_TIMEOUT);
-               }
-       }
-
-       if (likely(fence != NULL))
+       vmw_execbuf_copy_fence_user(dev_priv, vmw_fpriv(file_priv), ret,
+                                   user_fence_rep, fence, handle);
+
+       /* Don't unreference when handing fence out */
+       if (unlikely(out_fence != NULL)) {
+               *out_fence = fence;
+               fence = NULL;
+       } else if (likely(fence != NULL)) {
                 vmw_fence_obj_unreference(&fence);
+       }
  
-       vmw_kms_cursor_post_execbuf(dev_priv);
-       ttm_read_unlock(&vmaster->lock);
+       mutex_unlock(&dev_priv->cmdbuf_mutex);
         return 0;
+
  out_err:
         vmw_free_relocations(sw_context);
  out_throttle:
+       vmw_query_switch_backoff(sw_context);
         ttm_eu_backoff_reservation(&sw_context->validate_nodes);
         vmw_clear_validations(sw_context);
  out_unlock:
         mutex_unlock(&dev_priv->cmdbuf_mutex);
-out_no_cmd_mutex:
+       return ret;
+}
+
+/**
+ * vmw_execbuf_unpin_panic - Idle the fifo and unpin the query buffer.
+ *
+ * @dev_priv: The device private structure.
+ *
+ * This function is called to idle the fifo and unpin the query buffer
+ * if the normal way to do this hits an error, which should typically be
+ * extremely rare.
+ */
+static void vmw_execbuf_unpin_panic(struct vmw_private *dev_priv)
+{
+       DRM_ERROR("Can't unpin query buffer. Trying to recover.\n");
+
+       (void) vmw_fallback_wait(dev_priv, false, true, 0, false, 10*HZ);
+       vmw_bo_pin(dev_priv->pinned_bo, false);
+       vmw_bo_pin(dev_priv->dummy_query_bo, false);
+       dev_priv->dummy_query_bo_pinned = false;
+}
+
+
+/**
+ * vmw_execbuf_release_pinned_bo - Flush queries and unpin the pinned
+ * query bo.
+ *
+ * @dev_priv: The device private structure.
+ * @only_on_cid_match: Only flush and unpin if the current active query cid
+ * matches @cid.
+ * @cid: Optional context id to match.
+ *
+ * This function should be used to unpin the pinned query bo, or
+ * as a query barrier when we need to make sure that all queries have
+ * finished before the next fifo command. (For example on hardware
+ * context destructions where the hardware may otherwise leak unfinished
+ * queries).
+ *
+ * This function does not return any failure codes, but make attempts
+ * to do safe unpinning in case of errors.
+ *
+ * The function will synchronize on the previous query barrier, and will
+ * thus not finish until that barrier has executed.
+ */
+void vmw_execbuf_release_pinned_bo(struct vmw_private *dev_priv,
+                                  bool only_on_cid_match, uint32_t cid)
+{
+       int ret = 0;
+       struct list_head validate_list;
+       struct ttm_validate_buffer pinned_val, query_val;
+       struct vmw_fence_obj *fence;
+
+       mutex_lock(&dev_priv->cmdbuf_mutex);
+
+       if (dev_priv->pinned_bo == NULL)
+               goto out_unlock;
+
+       if (only_on_cid_match && cid != dev_priv->query_cid)
+               goto out_unlock;
+
+       INIT_LIST_HEAD(&validate_list);
+
+       pinned_val.new_sync_obj_arg = (void *)(unsigned long)
+               DRM_VMW_FENCE_FLAG_EXEC;
+       pinned_val.bo = ttm_bo_reference(dev_priv->pinned_bo);
+       list_add_tail(&pinned_val.head, &validate_list);
+
+       query_val.new_sync_obj_arg = pinned_val.new_sync_obj_arg;
+       query_val.bo = ttm_bo_reference(dev_priv->dummy_query_bo);
+       list_add_tail(&query_val.head, &validate_list);
+
+       do {
+               ret = ttm_eu_reserve_buffers(&validate_list);
+       } while (ret == -ERESTARTSYS);
+
+       if (unlikely(ret != 0)) {
+               vmw_execbuf_unpin_panic(dev_priv);
+               goto out_no_reserve;
+       }
+
+       ret = vmw_fifo_emit_dummy_query(dev_priv, dev_priv->query_cid);
+       if (unlikely(ret != 0)) {
+               vmw_execbuf_unpin_panic(dev_priv);
+               goto out_no_emit;
+       }
+
+       vmw_bo_pin(dev_priv->pinned_bo, false);
+       vmw_bo_pin(dev_priv->dummy_query_bo, false);
+       dev_priv->dummy_query_bo_pinned = false;
+
+       (void) vmw_execbuf_fence_commands(NULL, dev_priv, &fence, NULL);
+       ttm_eu_fence_buffer_objects(&validate_list, (void *) fence);
+
+       ttm_bo_unref(&query_val.bo);
+       ttm_bo_unref(&pinned_val.bo);
+       ttm_bo_unref(&dev_priv->pinned_bo);
+
+out_unlock:
+       mutex_unlock(&dev_priv->cmdbuf_mutex);
+       return;
+
+out_no_emit:
+       ttm_eu_backoff_reservation(&validate_list);
+out_no_reserve:
+       ttm_bo_unref(&query_val.bo);
+       ttm_bo_unref(&pinned_val.bo);
+       ttm_bo_unref(&dev_priv->pinned_bo);
+       mutex_unlock(&dev_priv->cmdbuf_mutex);
+}
+
+
+int vmw_execbuf_ioctl(struct drm_device *dev, void *data,
+                     struct drm_file *file_priv)
+{
+       struct vmw_private *dev_priv = vmw_priv(dev);
+       struct drm_vmw_execbuf_arg *arg = (struct drm_vmw_execbuf_arg *)data;
+       struct vmw_master *vmaster = vmw_master(file_priv->master);
+       int ret;
+
+       /*
+        * This will allow us to extend the ioctl argument while
+        * maintaining backwards compatibility:
+        * We take different code paths depending on the value of
+        * arg->version.
+        */
+
+       if (unlikely(arg->version != DRM_VMW_EXECBUF_VERSION)) {
+               DRM_ERROR("Incorrect execbuf version.\n");
+               DRM_ERROR("You're running outdated experimental "
+                         "vmwgfx user-space drivers.");
+               return -EINVAL;
+       }
+
+       ret = ttm_read_lock(&vmaster->lock, true);
+       if (unlikely(ret != 0))
+               return ret;
+
+       ret = vmw_execbuf_process(file_priv, dev_priv,
+                                 (void __user *)(unsigned long)arg->commands,
+                                 NULL, arg->command_size, arg->throttle_us,
+                                 (void __user *)(unsigned long)arg->fence_rep,
+                                 NULL);
+
+       if (unlikely(ret != 0))
+               goto out_unlock;
+
+       vmw_kms_cursor_post_execbuf(dev_priv);
+
+out_unlock:
         ttm_read_unlock(&vmaster->lock);
         return ret;
  }