Subversion Repositories Kolibri OS

Rev

Rev 3480 | Rev 4104 | Go to most recent revision | Blame | Compare with Previous | Last modification | View Log | Download | RSS feed

  1. /*
  2.  * Copyright © 2011-2012 Intel Corporation
  3.  *
  4.  * Permission is hereby granted, free of charge, to any person obtaining a
  5.  * copy of this software and associated documentation files (the "Software"),
  6.  * to deal in the Software without restriction, including without limitation
  7.  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8.  * and/or sell copies of the Software, and to permit persons to whom the
  9.  * Software is furnished to do so, subject to the following conditions:
  10.  *
  11.  * The above copyright notice and this permission notice (including the next
  12.  * paragraph) shall be included in all copies or substantial portions of the
  13.  * Software.
  14.  *
  15.  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16.  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17.  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  18.  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19.  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  20.  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
  21.  * IN THE SOFTWARE.
  22.  *
  23.  * Authors:
  24.  *    Ben Widawsky <ben@bwidawsk.net>
  25.  *
  26.  */
  27.  
  28. /*
  29.  * This file implements HW context support. On gen5+ a HW context consists of an
  30.  * opaque GPU object which is referenced at times of context saves and restores.
  31.  * With RC6 enabled, the context is also referenced as the GPU enters and exists
  32.  * from RC6 (GPU has it's own internal power context, except on gen5). Though
  33.  * something like a context does exist for the media ring, the code only
  34.  * supports contexts for the render ring.
  35.  *
  36.  * In software, there is a distinction between contexts created by the user,
  37.  * and the default HW context. The default HW context is used by GPU clients
  38.  * that do not request setup of their own hardware context. The default
  39.  * context's state is never restored to help prevent programming errors. This
  40.  * would happen if a client ran and piggy-backed off another clients GPU state.
  41.  * The default context only exists to give the GPU some offset to load as the
  42.  * current to invoke a save of the context we actually care about. In fact, the
  43.  * code could likely be constructed, albeit in a more complicated fashion, to
  44.  * never use the default context, though that limits the driver's ability to
  45.  * swap out, and/or destroy other contexts.
  46.  *
  47.  * All other contexts are created as a request by the GPU client. These contexts
  48.  * store GPU state, and thus allow GPU clients to not re-emit state (and
  49.  * potentially query certain state) at any time. The kernel driver makes
  50.  * certain that the appropriate commands are inserted.
  51.  *
  52.  * The context life cycle is semi-complicated in that context BOs may live
  53.  * longer than the context itself because of the way the hardware, and object
  54.  * tracking works. Below is a very crude representation of the state machine
  55.  * describing the context life.
  56.  *                                         refcount     pincount     active
  57.  * S0: initial state                          0            0           0
  58.  * S1: context created                        1            0           0
  59.  * S2: context is currently running           2            1           X
  60.  * S3: GPU referenced, but not current        2            0           1
  61.  * S4: context is current, but destroyed      1            1           0
  62.  * S5: like S3, but destroyed                 1            0           1
  63.  *
  64.  * The most common (but not all) transitions:
  65.  * S0->S1: client creates a context
  66.  * S1->S2: client submits execbuf with context
  67.  * S2->S3: other clients submits execbuf with context
  68.  * S3->S1: context object was retired
  69.  * S3->S2: clients submits another execbuf
  70.  * S2->S4: context destroy called with current context
  71.  * S3->S5->S0: destroy path
  72.  * S4->S5->S0: destroy path on current context
  73.  *
  74.  * There are two confusing terms used above:
  75.  *  The "current context" means the context which is currently running on the
  76.  *  GPU. The GPU has loaded it's state already and has stored away the gtt
  77.  *  offset of the BO. The GPU is not actively referencing the data at this
  78.  *  offset, but it will on the next context switch. The only way to avoid this
  79.  *  is to do a GPU reset.
  80.  *
  81.  *  An "active context' is one which was previously the "current context" and is
  82.  *  on the active list waiting for the next context switch to occur. Until this
  83.  *  happens, the object must remain at the same gtt offset. It is therefore
  84.  *  possible to destroy a context, but it is still active.
  85.  *
  86.  */
  87.  
  88. #include <drm/drmP.h>
  89. #include <drm/i915_drm.h>
  90. #include "i915_drv.h"
  91.  
  92. /* This is a HW constraint. The value below is the largest known requirement
  93.  * I've seen in a spec to date, and that was a workaround for a non-shipping
  94.  * part. It should be safe to decrease this, but it's more future proof as is.
  95.  */
  96. #define CONTEXT_ALIGN (64<<10)
  97.  
  98. static struct i915_hw_context *
  99. i915_gem_context_get(struct drm_i915_file_private *file_priv, u32 id);
  100. static int do_switch(struct i915_hw_context *to);
  101.  
  102. static int get_context_size(struct drm_device *dev)
  103. {
  104.         struct drm_i915_private *dev_priv = dev->dev_private;
  105.         int ret;
  106.         u32 reg;
  107.  
  108.         switch (INTEL_INFO(dev)->gen) {
  109.         case 6:
  110.                 reg = I915_READ(CXT_SIZE);
  111.                 ret = GEN6_CXT_TOTAL_SIZE(reg) * 64;
  112.                 break;
  113.         case 7:
  114.                 reg = I915_READ(GEN7_CXT_SIZE);
  115.                 if (IS_HASWELL(dev))
  116.                         ret = HSW_CXT_TOTAL_SIZE(reg) * 64;
  117.                 else
  118.                         ret = GEN7_CXT_TOTAL_SIZE(reg) * 64;
  119.                 break;
  120.         default:
  121.                 BUG();
  122.         }
  123.  
  124.         return ret;
  125. }
  126.  
  127. static void do_destroy(struct i915_hw_context *ctx)
  128. {
  129.         if (ctx->file_priv)
  130.                 idr_remove(&ctx->file_priv->context_idr, ctx->id);
  131.  
  132.         drm_gem_object_unreference(&ctx->obj->base);
  133.         kfree(ctx);
  134. }
  135.  
  136. static struct i915_hw_context *
  137. create_hw_context(struct drm_device *dev,
  138.                   struct drm_i915_file_private *file_priv)
  139. {
  140.         struct drm_i915_private *dev_priv = dev->dev_private;
  141.         struct i915_hw_context *ctx;
  142.         int ret;
  143.  
  144.         ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
  145.         if (ctx == NULL)
  146.                 return ERR_PTR(-ENOMEM);
  147.  
  148.         ctx->obj = i915_gem_alloc_object(dev, dev_priv->hw_context_size);
  149.         if (ctx->obj == NULL) {
  150.                 kfree(ctx);
  151.                 DRM_DEBUG_DRIVER("Context object allocated failed\n");
  152.                 return ERR_PTR(-ENOMEM);
  153.         }
  154.  
  155.         if (INTEL_INFO(dev)->gen >= 7) {
  156.                 ret = i915_gem_object_set_cache_level(ctx->obj,
  157.                                                       I915_CACHE_LLC_MLC);
  158.                 if (ret)
  159.                         goto err_out;
  160.         }
  161.  
  162.         /* The ring associated with the context object is handled by the normal
  163.          * object tracking code. We give an initial ring value simple to pass an
  164.          * assertion in the context switch code.
  165.          */
  166.         ctx->ring = &dev_priv->ring[RCS];
  167.  
  168.         /* Default context will never have a file_priv */
  169.         if (file_priv == NULL)
  170.                 return ctx;
  171.  
  172.         ctx->file_priv = file_priv;
  173.  
  174.         ret = idr_alloc(&file_priv->context_idr, ctx, DEFAULT_CONTEXT_ID + 1, 0,
  175.                         GFP_KERNEL);
  176.         if (ret < 0)
  177.                 goto err_out;
  178.         ctx->id = ret;
  179.  
  180.         return ctx;
  181.  
  182. err_out:
  183.         do_destroy(ctx);
  184.         return ERR_PTR(ret);
  185. }
  186.  
  187. static inline bool is_default_context(struct i915_hw_context *ctx)
  188. {
  189.         return (ctx == ctx->ring->default_context);
  190. }
  191.  
  192. /**
  193.  * The default context needs to exist per ring that uses contexts. It stores the
  194.  * context state of the GPU for applications that don't utilize HW contexts, as
  195.  * well as an idle case.
  196.  */
  197. static int create_default_context(struct drm_i915_private *dev_priv)
  198. {
  199.         struct i915_hw_context *ctx;
  200.         int ret;
  201.  
  202.         BUG_ON(!mutex_is_locked(&dev_priv->dev->struct_mutex));
  203.  
  204.         ctx = create_hw_context(dev_priv->dev, NULL);
  205.         if (IS_ERR(ctx))
  206.                 return PTR_ERR(ctx);
  207.  
  208.         /* We may need to do things with the shrinker which require us to
  209.          * immediately switch back to the default context. This can cause a
  210.          * problem as pinning the default context also requires GTT space which
  211.          * may not be available. To avoid this we always pin the
  212.          * default context.
  213.          */
  214.         dev_priv->ring[RCS].default_context = ctx;
  215.         ret = i915_gem_object_pin(ctx->obj, CONTEXT_ALIGN, false, false);
  216.         if (ret)
  217.                 goto err_destroy;
  218.  
  219.         ret = do_switch(ctx);
  220.         if (ret)
  221.                 goto err_unpin;
  222.  
  223.         DRM_DEBUG_DRIVER("Default HW context loaded\n");
  224.         return 0;
  225.  
  226. err_unpin:
  227.         i915_gem_object_unpin(ctx->obj);
  228. err_destroy:
  229.         do_destroy(ctx);
  230.         return ret;
  231. }
  232.  
  233. void i915_gem_context_init(struct drm_device *dev)
  234. {
  235.         struct drm_i915_private *dev_priv = dev->dev_private;
  236.  
  237.         if (!HAS_HW_CONTEXTS(dev)) {
  238.                 dev_priv->hw_contexts_disabled = true;
  239.                 return;
  240.         }
  241.  
  242.         /* If called from reset, or thaw... we've been here already */
  243.         if (dev_priv->hw_contexts_disabled ||
  244.             dev_priv->ring[RCS].default_context)
  245.                 return;
  246.  
  247.         dev_priv->hw_context_size = round_up(get_context_size(dev), 4096);
  248.  
  249.         if (dev_priv->hw_context_size > (1<<20)) {
  250.                 dev_priv->hw_contexts_disabled = true;
  251.                 return;
  252.         }
  253.  
  254.         if (create_default_context(dev_priv)) {
  255.                 dev_priv->hw_contexts_disabled = true;
  256.                 return;
  257.         }
  258.  
  259.         DRM_DEBUG_DRIVER("HW context support initialized\n");
  260. }
  261.  
  262. void i915_gem_context_fini(struct drm_device *dev)
  263. {
  264.         struct drm_i915_private *dev_priv = dev->dev_private;
  265.  
  266.         if (dev_priv->hw_contexts_disabled)
  267.                 return;
  268.  
  269.         /* The only known way to stop the gpu from accessing the hw context is
  270.          * to reset it. Do this as the very last operation to avoid confusing
  271.          * other code, leading to spurious errors. */
  272. //      intel_gpu_reset(dev);
  273.  
  274.         i915_gem_object_unpin(dev_priv->ring[RCS].default_context->obj);
  275.  
  276.         do_destroy(dev_priv->ring[RCS].default_context);
  277. }
  278.  
  279. static int context_idr_cleanup(int id, void *p, void *data)
  280. {
  281.         struct i915_hw_context *ctx = p;
  282.  
  283.         BUG_ON(id == DEFAULT_CONTEXT_ID);
  284.  
  285.         do_destroy(ctx);
  286.  
  287.         return 0;
  288. }
  289.  
  290. void i915_gem_context_close(struct drm_device *dev, struct drm_file *file)
  291. {
  292.         struct drm_i915_file_private *file_priv = file->driver_priv;
  293.  
  294.         mutex_lock(&dev->struct_mutex);
  295. //      idr_for_each(&file_priv->context_idr, context_idr_cleanup, NULL);
  296.         idr_destroy(&file_priv->context_idr);
  297.         mutex_unlock(&dev->struct_mutex);
  298. }
  299.  
  300. static struct i915_hw_context *
  301. i915_gem_context_get(struct drm_i915_file_private *file_priv, u32 id)
  302. {
  303.         return (struct i915_hw_context *)idr_find(&file_priv->context_idr, id);
  304. }
  305.  
  306. static inline int
  307. mi_set_context(struct intel_ring_buffer *ring,
  308.                struct i915_hw_context *new_context,
  309.                u32 hw_flags)
  310. {
  311.         int ret;
  312.  
  313.         /* w/a: If Flush TLB Invalidation Mode is enabled, driver must do a TLB
  314.          * invalidation prior to MI_SET_CONTEXT. On GEN6 we don't set the value
  315.          * explicitly, so we rely on the value at ring init, stored in
  316.          * itlb_before_ctx_switch.
  317.          */
  318.         if (IS_GEN6(ring->dev) && ring->itlb_before_ctx_switch) {
  319.                 ret = ring->flush(ring, I915_GEM_GPU_DOMAINS, 0);
  320.                 if (ret)
  321.                         return ret;
  322.         }
  323.  
  324.         ret = intel_ring_begin(ring, 6);
  325.         if (ret)
  326.                 return ret;
  327.  
  328.         if (IS_GEN7(ring->dev))
  329.                 intel_ring_emit(ring, MI_ARB_ON_OFF | MI_ARB_DISABLE);
  330.         else
  331.                 intel_ring_emit(ring, MI_NOOP);
  332.  
  333.         intel_ring_emit(ring, MI_NOOP);
  334.         intel_ring_emit(ring, MI_SET_CONTEXT);
  335.         intel_ring_emit(ring, new_context->obj->gtt_offset |
  336.                         MI_MM_SPACE_GTT |
  337.                         MI_SAVE_EXT_STATE_EN |
  338.                         MI_RESTORE_EXT_STATE_EN |
  339.                         hw_flags);
  340.         /* w/a: MI_SET_CONTEXT must always be followed by MI_NOOP */
  341.         intel_ring_emit(ring, MI_NOOP);
  342.  
  343.         if (IS_GEN7(ring->dev))
  344.                 intel_ring_emit(ring, MI_ARB_ON_OFF | MI_ARB_ENABLE);
  345.         else
  346.                 intel_ring_emit(ring, MI_NOOP);
  347.  
  348.         intel_ring_advance(ring);
  349.  
  350.         return ret;
  351. }
  352.  
  353. static int do_switch(struct i915_hw_context *to)
  354. {
  355.         struct intel_ring_buffer *ring = to->ring;
  356.         struct drm_i915_gem_object *from_obj = ring->last_context_obj;
  357.         u32 hw_flags = 0;
  358.         int ret;
  359.  
  360.         BUG_ON(from_obj != NULL && from_obj->pin_count == 0);
  361.  
  362.         if (from_obj == to->obj)
  363.                 return 0;
  364.  
  365.         ret = i915_gem_object_pin(to->obj, CONTEXT_ALIGN, false, false);
  366.         if (ret)
  367.                 return ret;
  368.  
  369.         /* Clear this page out of any CPU caches for coherent swap-in/out. Note
  370.          * that thanks to write = false in this call and us not setting any gpu
  371.          * write domains when putting a context object onto the active list
  372.          * (when switching away from it), this won't block.
  373.          * XXX: We need a real interface to do this instead of trickery. */
  374.         ret = i915_gem_object_set_to_gtt_domain(to->obj, false);
  375.         if (ret) {
  376.                 i915_gem_object_unpin(to->obj);
  377.                 return ret;
  378.         }
  379.  
  380.         if (!to->obj->has_global_gtt_mapping)
  381.                 i915_gem_gtt_bind_object(to->obj, to->obj->cache_level);
  382.  
  383.         if (!to->is_initialized || is_default_context(to))
  384.                 hw_flags |= MI_RESTORE_INHIBIT;
  385.         else if (WARN_ON_ONCE(from_obj == to->obj)) /* not yet expected */
  386.                 hw_flags |= MI_FORCE_RESTORE;
  387.  
  388.         ret = mi_set_context(ring, to, hw_flags);
  389.         if (ret) {
  390.                 i915_gem_object_unpin(to->obj);
  391.                 return ret;
  392.         }
  393.  
  394.         /* The backing object for the context is done after switching to the
  395.          * *next* context. Therefore we cannot retire the previous context until
  396.          * the next context has already started running. In fact, the below code
  397.          * is a bit suboptimal because the retiring can occur simply after the
  398.          * MI_SET_CONTEXT instead of when the next seqno has completed.
  399.          */
  400.         if (from_obj != NULL) {
  401.                 from_obj->base.read_domains = I915_GEM_DOMAIN_INSTRUCTION;
  402.                 i915_gem_object_move_to_active(from_obj, ring);
  403.                 /* As long as MI_SET_CONTEXT is serializing, ie. it flushes the
  404.                  * whole damn pipeline, we don't need to explicitly mark the
  405.                  * object dirty. The only exception is that the context must be
  406.                  * correct in case the object gets swapped out. Ideally we'd be
  407.                  * able to defer doing this until we know the object would be
  408.                  * swapped, but there is no way to do that yet.
  409.                  */
  410.                 from_obj->dirty = 1;
  411.                 BUG_ON(from_obj->ring != ring);
  412.                 i915_gem_object_unpin(from_obj);
  413.  
  414.                 drm_gem_object_unreference(&from_obj->base);
  415.         }
  416.  
  417.         drm_gem_object_reference(&to->obj->base);
  418.         ring->last_context_obj = to->obj;
  419.         to->is_initialized = true;
  420.  
  421.         return 0;
  422. }
  423.  
  424. /**
  425.  * i915_switch_context() - perform a GPU context switch.
  426.  * @ring: ring for which we'll execute the context switch
  427.  * @file_priv: file_priv associated with the context, may be NULL
  428.  * @id: context id number
  429.  * @seqno: sequence number by which the new context will be switched to
  430.  * @flags:
  431.  *
  432.  * The context life cycle is simple. The context refcount is incremented and
  433.  * decremented by 1 and create and destroy. If the context is in use by the GPU,
  434.  * it will have a refoucnt > 1. This allows us to destroy the context abstract
  435.  * object while letting the normal object tracking destroy the backing BO.
  436.  */
  437. int i915_switch_context(struct intel_ring_buffer *ring,
  438.                         struct drm_file *file,
  439.                         int to_id)
  440. {
  441.         struct drm_i915_private *dev_priv = ring->dev->dev_private;
  442.         struct i915_hw_context *to;
  443.  
  444.         if (dev_priv->hw_contexts_disabled)
  445.                 return 0;
  446.  
  447.         if (ring != &dev_priv->ring[RCS])
  448.                 return 0;
  449.  
  450.         if (to_id == DEFAULT_CONTEXT_ID) {
  451.                 to = ring->default_context;
  452.         } else {
  453.                 if (file == NULL)
  454.                         return -EINVAL;
  455.  
  456.                 to = i915_gem_context_get(file->driver_priv, to_id);
  457.                 if (to == NULL)
  458.                         return -ENOENT;
  459.         }
  460.  
  461.         return do_switch(to);
  462. }
  463.  
  464. #if 0
  465. int i915_gem_context_create_ioctl(struct drm_device *dev, void *data,
  466.                                   struct drm_file *file)
  467. {
  468.         struct drm_i915_private *dev_priv = dev->dev_private;
  469.         struct drm_i915_gem_context_create *args = data;
  470.         struct drm_i915_file_private *file_priv = file->driver_priv;
  471.         struct i915_hw_context *ctx;
  472.         int ret;
  473.  
  474.         if (!(dev->driver->driver_features & DRIVER_GEM))
  475.                 return -ENODEV;
  476.  
  477.         if (dev_priv->hw_contexts_disabled)
  478.                 return -ENODEV;
  479.  
  480.         ret = i915_mutex_lock_interruptible(dev);
  481.         if (ret)
  482.                 return ret;
  483.  
  484.         ctx = create_hw_context(dev, file_priv);
  485.         mutex_unlock(&dev->struct_mutex);
  486.         if (IS_ERR(ctx))
  487.                 return PTR_ERR(ctx);
  488.  
  489.         args->ctx_id = ctx->id;
  490.         DRM_DEBUG_DRIVER("HW context %d created\n", args->ctx_id);
  491.  
  492.         return 0;
  493. }
  494.  
  495. int i915_gem_context_destroy_ioctl(struct drm_device *dev, void *data,
  496.                                    struct drm_file *file)
  497. {
  498.         struct drm_i915_gem_context_destroy *args = data;
  499.         struct drm_i915_file_private *file_priv = file->driver_priv;
  500.         struct i915_hw_context *ctx;
  501.         int ret;
  502.  
  503.         if (!(dev->driver->driver_features & DRIVER_GEM))
  504.                 return -ENODEV;
  505.  
  506.         ret = i915_mutex_lock_interruptible(dev);
  507.         if (ret)
  508.                 return ret;
  509.  
  510.         ctx = i915_gem_context_get(file_priv, args->ctx_id);
  511.         if (!ctx) {
  512.                 mutex_unlock(&dev->struct_mutex);
  513.                 return -ENOENT;
  514.         }
  515.  
  516.         do_destroy(ctx);
  517.  
  518.         mutex_unlock(&dev->struct_mutex);
  519.  
  520.         DRM_DEBUG_DRIVER("HW context %d destroyed\n", args->ctx_id);
  521.         return 0;
  522. }
  523.  
  524. #endif
  525.