Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/ohad/hwspinlock
[pandora-kernel.git] / drivers / gpu / drm / vmwgfx / vmwgfx_drv.c
index bff7932..13afddc 100644 (file)
 #define DRM_IOCTL_VMW_EXECBUF                                  \
        DRM_IOW(DRM_COMMAND_BASE + DRM_VMW_EXECBUF,             \
                struct drm_vmw_execbuf_arg)
-#define DRM_IOCTL_VMW_FIFO_DEBUG                               \
-       DRM_IOWR(DRM_COMMAND_BASE + DRM_VMW_FIFO_DEBUG,         \
-                struct drm_vmw_fifo_debug_arg)
+#define DRM_IOCTL_VMW_GET_3D_CAP                               \
+       DRM_IOW(DRM_COMMAND_BASE + DRM_VMW_GET_3D_CAP,          \
+                struct drm_vmw_get_3d_cap_arg)
 #define DRM_IOCTL_VMW_FENCE_WAIT                               \
        DRM_IOWR(DRM_COMMAND_BASE + DRM_VMW_FENCE_WAIT,         \
                 struct drm_vmw_fence_wait_arg)
-#define DRM_IOCTL_VMW_UPDATE_LAYOUT                            \
-       DRM_IOWR(DRM_COMMAND_BASE + DRM_VMW_UPDATE_LAYOUT,      \
-                struct drm_vmw_update_layout_arg)
-
+#define DRM_IOCTL_VMW_FENCE_SIGNALED                           \
+       DRM_IOWR(DRM_COMMAND_BASE + DRM_VMW_FENCE_SIGNALED,     \
+                struct drm_vmw_fence_signaled_arg)
+#define DRM_IOCTL_VMW_FENCE_UNREF                              \
+       DRM_IOW(DRM_COMMAND_BASE + DRM_VMW_FENCE_UNREF,         \
+                struct drm_vmw_fence_arg)
+#define DRM_IOCTL_VMW_FENCE_EVENT                              \
+       DRM_IOW(DRM_COMMAND_BASE + DRM_VMW_FENCE_EVENT,         \
+                struct drm_vmw_fence_event_arg)
+#define DRM_IOCTL_VMW_PRESENT                                  \
+       DRM_IOW(DRM_COMMAND_BASE + DRM_VMW_PRESENT,             \
+                struct drm_vmw_present_arg)
+#define DRM_IOCTL_VMW_PRESENT_READBACK                         \
+       DRM_IOW(DRM_COMMAND_BASE + DRM_VMW_PRESENT_READBACK,    \
+                struct drm_vmw_present_readback_arg)
 
 /**
  * The core DRM version of this macro doesn't account for
@@ -135,12 +146,25 @@ static struct drm_ioctl_desc vmw_ioctls[] = {
                      DRM_AUTH | DRM_UNLOCKED),
        VMW_IOCTL_DEF(VMW_EXECBUF, vmw_execbuf_ioctl,
                      DRM_AUTH | DRM_UNLOCKED),
-       VMW_IOCTL_DEF(VMW_FIFO_DEBUG, vmw_fifo_debug_ioctl,
-                     DRM_AUTH | DRM_ROOT_ONLY | DRM_MASTER | DRM_UNLOCKED),
-       VMW_IOCTL_DEF(VMW_FENCE_WAIT, vmw_fence_wait_ioctl,
+       VMW_IOCTL_DEF(VMW_FENCE_WAIT, vmw_fence_obj_wait_ioctl,
+                     DRM_AUTH | DRM_UNLOCKED),
+       VMW_IOCTL_DEF(VMW_FENCE_SIGNALED,
+                     vmw_fence_obj_signaled_ioctl,
+                     DRM_AUTH | DRM_UNLOCKED),
+       VMW_IOCTL_DEF(VMW_FENCE_UNREF, vmw_fence_obj_unref_ioctl,
+                     DRM_AUTH | DRM_UNLOCKED),
+       VMW_IOCTL_DEF(VMW_FENCE_EVENT,
+                     vmw_fence_event_ioctl,
+                     DRM_AUTH | DRM_UNLOCKED),
+       VMW_IOCTL_DEF(VMW_GET_3D_CAP, vmw_get_cap_3d_ioctl,
                      DRM_AUTH | DRM_UNLOCKED),
-       VMW_IOCTL_DEF(VMW_UPDATE_LAYOUT, vmw_kms_update_layout_ioctl,
-                     DRM_MASTER | DRM_CONTROL_ALLOW | DRM_UNLOCKED)
+
+       /* these allow direct access to the framebuffers mark as master only */
+       VMW_IOCTL_DEF(VMW_PRESENT, vmw_present_ioctl,
+                     DRM_MASTER | DRM_AUTH | DRM_UNLOCKED),
+       VMW_IOCTL_DEF(VMW_PRESENT_READBACK,
+                     vmw_present_readback_ioctl,
+                     DRM_MASTER | DRM_AUTH | DRM_UNLOCKED),
 };
 
 static struct pci_device_id vmw_pci_id_list[] = {
@@ -195,6 +219,72 @@ static void vmw_print_capabilities(uint32_t capabilities)
                DRM_INFO("  Screen Object 2.\n");
 }
 
+
+/**
+ * vmw_execbuf_prepare_dummy_query - Initialize a query result structure at
+ * the start of a buffer object.
+ *
+ * @dev_priv: The device private structure.
+ *
+ * This function will idle the buffer using an uninterruptible wait, then
+ * map the first page and initialize a pending occlusion query result structure,
+ * Finally it will unmap the buffer.
+ *
+ * TODO: Since we're only mapping a single page, we should optimize the map
+ * to use kmap_atomic / iomap_atomic.
+ */
+static void vmw_dummy_query_bo_prepare(struct vmw_private *dev_priv)
+{
+       struct ttm_bo_kmap_obj map;
+       volatile SVGA3dQueryResult *result;
+       bool dummy;
+       int ret;
+       struct ttm_bo_device *bdev = &dev_priv->bdev;
+       struct ttm_buffer_object *bo = dev_priv->dummy_query_bo;
+
+       ttm_bo_reserve(bo, false, false, false, 0);
+       spin_lock(&bdev->fence_lock);
+       ret = ttm_bo_wait(bo, false, false, false);
+       spin_unlock(&bdev->fence_lock);
+       if (unlikely(ret != 0))
+               (void) vmw_fallback_wait(dev_priv, false, true, 0, false,
+                                        10*HZ);
+
+       ret = ttm_bo_kmap(bo, 0, 1, &map);
+       if (likely(ret == 0)) {
+               result = ttm_kmap_obj_virtual(&map, &dummy);
+               result->totalSize = sizeof(*result);
+               result->state = SVGA3D_QUERYSTATE_PENDING;
+               result->result32 = 0xff;
+               ttm_bo_kunmap(&map);
+       } else
+               DRM_ERROR("Dummy query buffer map failed.\n");
+       ttm_bo_unreserve(bo);
+}
+
+
+/**
+ * vmw_dummy_query_bo_create - create a bo to hold a dummy query result
+ *
+ * @dev_priv: A device private structure.
+ *
+ * This function creates a small buffer object that holds the query
+ * result for dummy queries emitted as query barriers.
+ * No interruptible waits are done within this function.
+ *
+ * Returns an error if bo creation fails.
+ */
+static int vmw_dummy_query_bo_create(struct vmw_private *dev_priv)
+{
+       return ttm_bo_create(&dev_priv->bdev,
+                            PAGE_SIZE,
+                            ttm_bo_type_device,
+                            &vmw_vram_sys_placement,
+                            0, 0, false, NULL,
+                            &dev_priv->dummy_query_bo);
+}
+
+
 static int vmw_request_device(struct vmw_private *dev_priv)
 {
        int ret;
@@ -204,12 +294,31 @@ static int vmw_request_device(struct vmw_private *dev_priv)
                DRM_ERROR("Unable to initialize FIFO.\n");
                return ret;
        }
+       vmw_fence_fifo_up(dev_priv->fman);
+       ret = vmw_dummy_query_bo_create(dev_priv);
+       if (unlikely(ret != 0))
+               goto out_no_query_bo;
+       vmw_dummy_query_bo_prepare(dev_priv);
 
        return 0;
+
+out_no_query_bo:
+       vmw_fence_fifo_down(dev_priv->fman);
+       vmw_fifo_release(dev_priv, &dev_priv->fifo);
+       return ret;
 }
 
 static void vmw_release_device(struct vmw_private *dev_priv)
 {
+       /*
+        * Previous destructions should've released
+        * the pinned bo.
+        */
+
+       BUG_ON(dev_priv->pinned_bo != NULL);
+
+       ttm_bo_unref(&dev_priv->dummy_query_bo);
+       vmw_fence_fifo_down(dev_priv->fman);
        vmw_fifo_release(dev_priv, &dev_priv->fifo);
 }
 
@@ -286,7 +395,7 @@ static int vmw_driver_load(struct drm_device *dev, unsigned long chipset)
 
        dev_priv->dev = dev;
        dev_priv->vmw_chipset = chipset;
-       dev_priv->last_read_sequence = (uint32_t) -100;
+       dev_priv->last_read_seqno = (uint32_t) -100;
        mutex_init(&dev_priv->hw_mutex);
        mutex_init(&dev_priv->cmdbuf_mutex);
        mutex_init(&dev_priv->release_mutex);
@@ -297,8 +406,10 @@ static int vmw_driver_load(struct drm_device *dev, unsigned long chipset)
        mutex_init(&dev_priv->init_mutex);
        init_waitqueue_head(&dev_priv->fence_queue);
        init_waitqueue_head(&dev_priv->fifo_queue);
-       atomic_set(&dev_priv->fence_queue_waiters, 0);
+       dev_priv->fence_queue_waiters = 0;
        atomic_set(&dev_priv->fifo_queue_waiters, 0);
+       INIT_LIST_HEAD(&dev_priv->surface_lru);
+       dev_priv->used_memory_size = 0;
 
        dev_priv->io_start = pci_resource_start(dev->pdev, 0);
        dev_priv->vram_start = pci_resource_start(dev->pdev, 1);
@@ -319,6 +430,10 @@ static int vmw_driver_load(struct drm_device *dev, unsigned long chipset)
 
        dev_priv->capabilities = vmw_read(dev_priv, SVGA_REG_CAPABILITIES);
 
+       dev_priv->vram_size = vmw_read(dev_priv, SVGA_REG_VRAM_SIZE);
+       dev_priv->mmio_size = vmw_read(dev_priv, SVGA_REG_MEM_SIZE);
+       dev_priv->fb_max_width = vmw_read(dev_priv, SVGA_REG_MAX_WIDTH);
+       dev_priv->fb_max_height = vmw_read(dev_priv, SVGA_REG_MAX_HEIGHT);
        if (dev_priv->capabilities & SVGA_CAP_GMR) {
                dev_priv->max_gmr_descriptors =
                        vmw_read(dev_priv,
@@ -331,13 +446,15 @@ static int vmw_driver_load(struct drm_device *dev, unsigned long chipset)
                        vmw_read(dev_priv, SVGA_REG_GMRS_MAX_PAGES);
                dev_priv->memory_size =
                        vmw_read(dev_priv, SVGA_REG_MEMORY_SIZE);
+               dev_priv->memory_size -= dev_priv->vram_size;
+       } else {
+               /*
+                * An arbitrary limit of 512MiB on surface
+                * memory. But all HWV8 hardware supports GMR2.
+                */
+               dev_priv->memory_size = 512*1024*1024;
        }
 
-       dev_priv->vram_size = vmw_read(dev_priv, SVGA_REG_VRAM_SIZE);
-       dev_priv->mmio_size = vmw_read(dev_priv, SVGA_REG_MEM_SIZE);
-       dev_priv->fb_max_width = vmw_read(dev_priv, SVGA_REG_MAX_WIDTH);
-       dev_priv->fb_max_height = vmw_read(dev_priv, SVGA_REG_MAX_HEIGHT);
-
        mutex_unlock(&dev_priv->hw_mutex);
 
        vmw_print_capabilities(dev_priv->capabilities);
@@ -351,8 +468,8 @@ static int vmw_driver_load(struct drm_device *dev, unsigned long chipset)
        if (dev_priv->capabilities & SVGA_CAP_GMR2) {
                DRM_INFO("Max number of GMR pages is %u\n",
                         (unsigned)dev_priv->max_gmr_pages);
-               DRM_INFO("Max dedicated hypervisor graphics memory is %u\n",
-                        (unsigned)dev_priv->memory_size);
+               DRM_INFO("Max dedicated hypervisor surface memory is %u kiB\n",
+                        (unsigned)dev_priv->memory_size / 1024);
        }
        DRM_INFO("VRAM at 0x%08x size is %u kiB\n",
                 dev_priv->vram_start, dev_priv->vram_size / 1024);
@@ -440,22 +557,34 @@ static int vmw_driver_load(struct drm_device *dev, unsigned long chipset)
                        goto out_no_device;
                }
        }
+
+       dev_priv->fman = vmw_fence_manager_init(dev_priv);
+       if (unlikely(dev_priv->fman == NULL))
+               goto out_no_fman;
+
+       /* Need to start the fifo to check if we can do screen objects */
+       ret = vmw_3d_resource_inc(dev_priv, true);
+       if (unlikely(ret != 0))
+               goto out_no_fifo;
+       vmw_kms_save_vga(dev_priv);
+
+       /* Start kms and overlay systems, needs fifo. */
        ret = vmw_kms_init(dev_priv);
        if (unlikely(ret != 0))
                goto out_no_kms;
        vmw_overlay_init(dev_priv);
+
+       /* 3D Depends on Screen Objects being used. */
+       DRM_INFO("Detected %sdevice 3D availability.\n",
+                vmw_fifo_have_3d(dev_priv) ?
+                "" : "no ");
+
+       /* We might be done with the fifo now */
        if (dev_priv->enable_fb) {
-               ret = vmw_3d_resource_inc(dev_priv, false);
-               if (unlikely(ret != 0))
-                       goto out_no_fifo;
-               vmw_kms_save_vga(dev_priv);
                vmw_fb_init(dev_priv);
-               DRM_INFO("%s", vmw_fifo_have_3d(dev_priv) ?
-                        "Detected device 3D availability.\n" :
-                        "Detected no device 3D availability.\n");
        } else {
-               DRM_INFO("Delayed 3D detection since we're not "
-                        "running the device in SVGA mode yet.\n");
+               vmw_kms_restore_vga(dev_priv);
+               vmw_3d_resource_dec(dev_priv, true);
        }
 
        if (dev_priv->capabilities & SVGA_CAP_IRQMASK) {
@@ -472,15 +601,19 @@ static int vmw_driver_load(struct drm_device *dev, unsigned long chipset)
        return 0;
 
 out_no_irq:
-       if (dev_priv->enable_fb) {
+       if (dev_priv->enable_fb)
                vmw_fb_close(dev_priv);
+       vmw_overlay_close(dev_priv);
+       vmw_kms_close(dev_priv);
+out_no_kms:
+       /* We still have a 3D resource reference held */
+       if (dev_priv->enable_fb) {
                vmw_kms_restore_vga(dev_priv);
                vmw_3d_resource_dec(dev_priv, false);
        }
 out_no_fifo:
-       vmw_overlay_close(dev_priv);
-       vmw_kms_close(dev_priv);
-out_no_kms:
+       vmw_fence_manager_takedown(dev_priv->fman);
+out_no_fman:
        if (dev_priv->stealth)
                pci_release_region(dev->pdev, 2);
        else
@@ -524,6 +657,7 @@ static int vmw_driver_unload(struct drm_device *dev)
        }
        vmw_kms_close(dev_priv);
        vmw_overlay_close(dev_priv);
+       vmw_fence_manager_takedown(dev_priv->fman);
        if (dev_priv->stealth)
                pci_release_region(dev->pdev, 2);
        else
@@ -757,7 +891,7 @@ static void vmw_master_drop(struct drm_device *dev,
 
        vmw_fp->locked_master = drm_master_get(file_priv->master);
        ret = ttm_vt_lock(&vmaster->lock, false, vmw_fp->tfile);
-       vmw_kms_idle_workqueues(vmaster);
+       vmw_execbuf_release_pinned_bo(dev_priv, false, 0);
 
        if (unlikely((ret != 0))) {
                DRM_ERROR("Unable to lock TTM at VT switch.\n");
@@ -809,6 +943,7 @@ static int vmwgfx_pm_notifier(struct notifier_block *nb, unsigned long val,
                 * This empties VRAM and unbinds all GMR bindings.
                 * Buffer contents is moved to swappable memory.
                 */
+               vmw_execbuf_release_pinned_bo(dev_priv, false, 0);
                ttm_bo_swapout_all(&dev_priv->bdev);
 
                break;
@@ -934,6 +1069,8 @@ static struct drm_driver driver = {
        .irq_uninstall = vmw_irq_uninstall,
        .irq_handler = vmw_irq_handler,
        .get_vblank_counter = vmw_get_vblank_counter,
+       .enable_vblank = vmw_enable_vblank,
+       .disable_vblank = vmw_disable_vblank,
        .reclaim_buffers_locked = NULL,
        .ioctls = vmw_ioctls,
        .num_ioctls = DRM_ARRAY_SIZE(vmw_ioctls),
@@ -950,7 +1087,8 @@ static struct drm_driver driver = {
                 .release = drm_release,
                 .unlocked_ioctl = vmw_unlocked_ioctl,
                 .mmap = vmw_mmap,
-                .poll = drm_poll,
+                .poll = vmw_fops_poll,
+                .read = vmw_fops_read,
                 .fasync = drm_fasync,
 #if defined(CONFIG_COMPAT)
                 .compat_ioctl = drm_compat_ioctl,