sched_fence.c

/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */
#include <linux/kthread.h>
#include <linux/wait.h>
#include <linux/sched.h>
#include <drm/drmP.h>

#include "gpu_scheduler.h"

static struct kmem_cache *sched_fence_slab;
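
/**
 * amd_sched_fence_slab_init - create the slab cache for scheduler fences
 *
 * Allocates the kmem cache that amd_sched_fence_create() draws fence
 * objects from. Returns 0 on success or -ENOMEM if the cache could not
 * be created.
 */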
int amd_sched_fence_slab_init(void)
{
	sched_fence_slab = kmem_cache_create(
		"amd_sched_fence", sizeof(struct amd_sched_fence), 0,
		SLAB_HWCACHE_ALIGN, NULL);
	if (!sched_fence_slab)
		return -ENOMEM;

	return 0;
}
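
/**
 * amd_sched_fence_slab_fini - destroy the scheduler fence slab cache
 *
 * Waits for outstanding RCU callbacks, which free fences back into the
 * cache, before destroying the cache itself.
 */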
void amd_sched_fence_slab_fini(void)
{
	rcu_barrier();
	kmem_cache_destroy(sched_fence_slab);
}
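
/**
 * amd_sched_fence_create - allocate and initialize a scheduler fence
 *
 * @entity: scheduler entity the fence belongs to
 * @owner: opaque owner pointer stored in the fence
 *
 * Allocates a fence from the slab cache and initializes its two embedded
 * dma_fences, "scheduled" and "finished". Both share the entity's next
 * sequence number; the scheduled fence lives on the entity's fence
 * context and the finished fence on fence_context + 1.
 * Returns NULL if allocation fails.
 */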
struct amd_sched_fence *amd_sched_fence_create(struct amd_sched_entity *entity,
					       void *owner)
{
	struct amd_sched_fence *fence = NULL;
	unsigned seq;

	fence = kmem_cache_zalloc(sched_fence_slab, GFP_KERNEL);
	if (fence == NULL)
		return NULL;

	fence->owner = owner;
	fence->sched = entity->sched;
	spin_lock_init(&fence->lock);

	seq = atomic_inc_return(&entity->fence_seq);
	dma_fence_init(&fence->scheduled, &amd_sched_fence_ops_scheduled,
		       &fence->lock, entity->fence_context, seq);
	dma_fence_init(&fence->finished, &amd_sched_fence_ops_finished,
		       &fence->lock, entity->fence_context + 1, seq);

	return fence;
}
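
/**
 * amd_sched_fence_scheduled - signal the "scheduled" part of the fence
 *
 * @fence: scheduler fence to signal
 *
 * Signals the scheduled dma_fence and emits a trace message noting
 * whether it was newly signaled or had been signaled already.
 */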
void amd_sched_fence_scheduled(struct amd_sched_fence *fence)
{
	int ret = dma_fence_signal(&fence->scheduled);

	if (!ret)
		DMA_FENCE_TRACE(&fence->scheduled,
				"signaled from irq context\n");
	else
		DMA_FENCE_TRACE(&fence->scheduled,
				"was already signaled\n");
}
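
/**
 * amd_sched_fence_finished - signal the "finished" part of the fence
 *
 * @fence: scheduler fence to signal
 *
 * Signals the finished dma_fence and emits a trace message noting
 * whether it was newly signaled or had been signaled already.
 */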
void amd_sched_fence_finished(struct amd_sched_fence *fence)
{
	int ret = dma_fence_signal(&fence->finished);

	if (!ret)
		DMA_FENCE_TRACE(&fence->finished,
				"signaled from irq context\n");
	else
		DMA_FENCE_TRACE(&fence->finished,
				"was already signaled\n");
}
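
/*
 * dma_fence_ops callbacks shared by the scheduled and finished fences;
 * the two ops tables at the bottom of this file differ only in their
 * release callback.
 */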
static const char *amd_sched_fence_get_driver_name(struct dma_fence *fence)
{
	return "amd_sched";
}

static const char *amd_sched_fence_get_timeline_name(struct dma_fence *f)
{
	struct amd_sched_fence *fence = to_amd_sched_fence(f);

	return (const char *)fence->sched->name;
}

static bool amd_sched_fence_enable_signaling(struct dma_fence *f)
{
	return true;
}

/**
 * amd_sched_fence_free - free up the fence memory
 *
 * @rcu: RCU callback head
 *
 * Free up the fence memory after the RCU grace period.
 */
static void amd_sched_fence_free(struct rcu_head *rcu)
{
	struct dma_fence *f = container_of(rcu, struct dma_fence, rcu);
	struct amd_sched_fence *fence = to_amd_sched_fence(f);

	dma_fence_put(fence->parent);
	kmem_cache_free(sched_fence_slab, fence);
}
/**
 * amd_sched_fence_release_scheduled - callback run when the fence can be freed
 *
 * @f: scheduled fence
 *
 * This function is called when the reference count becomes zero.
 * It just RCU schedules freeing up the fence.
 */
static void amd_sched_fence_release_scheduled(struct dma_fence *f)
{
	struct amd_sched_fence *fence = to_amd_sched_fence(f);

	call_rcu(&fence->finished.rcu, amd_sched_fence_free);
}
/**
 * amd_sched_fence_release_finished - drop extra reference
 *
 * @f: finished fence
 *
 * Drop the extra reference from the scheduled fence to the base fence.
 */
static void amd_sched_fence_release_finished(struct dma_fence *f)
{
	struct amd_sched_fence *fence = to_amd_sched_fence(f);

	dma_fence_put(&fence->scheduled);
}
const struct dma_fence_ops amd_sched_fence_ops_scheduled = {
	.get_driver_name = amd_sched_fence_get_driver_name,
	.get_timeline_name = amd_sched_fence_get_timeline_name,
	.enable_signaling = amd_sched_fence_enable_signaling,
	.signaled = NULL,
	.wait = dma_fence_default_wait,
	.release = amd_sched_fence_release_scheduled,
};

const struct dma_fence_ops amd_sched_fence_ops_finished = {
	.get_driver_name = amd_sched_fence_get_driver_name,
	.get_timeline_name = amd_sched_fence_get_timeline_name,
	.enable_signaling = amd_sched_fence_enable_signaling,
	.signaled = NULL,
	.wait = dma_fence_default_wait,
	.release = amd_sched_fence_release_finished,
};
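
/*
 * Typical lifecycle of a scheduler fence, as an illustrative sketch only:
 * the entity/owner variables and the points at which the scheduler core
 * calls these helpers are assumptions made for the example, not code from
 * this file.
 *
 *	struct amd_sched_fence *s_fence;
 *
 *	s_fence = amd_sched_fence_create(entity, owner);
 *	if (!s_fence)
 *		return -ENOMEM;
 *
 *	amd_sched_fence_scheduled(s_fence);	// job handed to the hardware
 *	amd_sched_fence_finished(s_fence);	// hardware reported completion
 *
 *	// Dropping the last reference on the finished fence puts the
 *	// scheduled fence; once the scheduled fence's count reaches zero
 *	// the whole object is RCU-freed back into the slab cache.
 *	dma_fence_put(&s_fence->finished);
 */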