
/*
 * Copyright © 2017 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 *
 */

#include <linux/prime_numbers.h>

#include "../i915_selftest.h"

#include "mock_drm.h"
#include "i915_random.h"
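
/*
 * Note: ordered from largest to smallest page size, so that
 * get_largest_page_size() below can simply return the first entry which is
 * both supported by the device and no larger than the remaining length.
 */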
static const unsigned int page_sizes[] = {
	I915_GTT_PAGE_SIZE_2M,
	I915_GTT_PAGE_SIZE_64K,
	I915_GTT_PAGE_SIZE_4K,
};

static unsigned int get_largest_page_size(struct drm_i915_private *i915,
					  u64 rem)
{
	int i;

	for (i = 0; i < ARRAY_SIZE(page_sizes); ++i) {
		unsigned int page_size = page_sizes[i];

		if (HAS_PAGE_SIZES(i915, page_size) && rem >= page_size)
			return page_size;
	}

	return 0;
}

static void huge_pages_free_pages(struct sg_table *st)
{
	struct scatterlist *sg;

	for (sg = st->sgl; sg; sg = __sg_next(sg)) {
		if (sg_page(sg))
			__free_pages(sg_page(sg), get_order(sg->length));
	}

	sg_free_table(st);
	kfree(st);
}
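
/*
 * get_pages backend for huge_page_ops: allocates real, physically contiguous
 * chunks so the object's sg list contains genuinely huge entries.
 *
 * Worked example: with page_mask = 2M | 64K | 4K and size = 2M + 64K + 4K,
 * the loops below emit one 2M chunk, then one 64K chunk, then one 4K chunk,
 * consuming every bit of the mask exactly as the
 * GEM_BUG_ON(sg_page_sizes != obj->mm.page_mask) check expects.
 */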
static int get_huge_pages(struct drm_i915_gem_object *obj)
{
#define GFP (GFP_KERNEL | __GFP_NOWARN | __GFP_NORETRY)
	unsigned int page_mask = obj->mm.page_mask;
	struct sg_table *st;
	struct scatterlist *sg;
	unsigned int sg_page_sizes;
	u64 rem;

	st = kmalloc(sizeof(*st), GFP);
	if (!st)
		return -ENOMEM;

	if (sg_alloc_table(st, obj->base.size >> PAGE_SHIFT, GFP)) {
		kfree(st);
		return -ENOMEM;
	}

	rem = obj->base.size;
	sg = st->sgl;
	st->nents = 0;
	sg_page_sizes = 0;

	/*
	 * Our goal here is simple, we want to greedily fill the object from
	 * largest to smallest page-size, while ensuring that we use *every*
	 * page-size as per the given page-mask.
	 */
	do {
		unsigned int bit = ilog2(page_mask);
		unsigned int page_size = BIT(bit);
		int order = get_order(page_size);

		/*
		 * Keep emitting chunks of this size while enough of the
		 * remainder is left over to also satisfy one page of each
		 * smaller size still set in the mask -- see the loop
		 * condition below.
		 */
		do {
			struct page *page;

			GEM_BUG_ON(order >= MAX_ORDER);
			page = alloc_pages(GFP | __GFP_ZERO, order);
			if (!page)
				goto err;

			sg_set_page(sg, page, page_size, 0);
			sg_page_sizes |= page_size;
			st->nents++;

			rem -= page_size;
			if (!rem) {
				sg_mark_end(sg);
				break;
			}

			sg = __sg_next(sg);
		} while ((rem - ((page_size-1) & page_mask)) >= page_size);

		page_mask &= (page_size-1);
	} while (page_mask);

	if (i915_gem_gtt_prepare_pages(obj, st))
		goto err;

	obj->mm.madv = I915_MADV_DONTNEED;

	GEM_BUG_ON(sg_page_sizes != obj->mm.page_mask);
	__i915_gem_object_set_pages(obj, st, sg_page_sizes);

	return 0;

err:
	sg_set_page(sg, NULL, 0, 0);
	sg_mark_end(sg);
	huge_pages_free_pages(st);

	return -ENOMEM;
}

static void put_huge_pages(struct drm_i915_gem_object *obj,
			   struct sg_table *pages)
{
	i915_gem_gtt_finish_pages(obj, pages);
	huge_pages_free_pages(pages);

	obj->mm.dirty = false;
	obj->mm.madv = I915_MADV_WILLNEED;
}

static const struct drm_i915_gem_object_ops huge_page_ops = {
	.flags = I915_GEM_OBJECT_HAS_STRUCT_PAGE |
		 I915_GEM_OBJECT_IS_SHRINKABLE,
	.get_pages = get_huge_pages,
	.put_pages = put_huge_pages,
};

static struct drm_i915_gem_object *
huge_pages_object(struct drm_i915_private *i915,
		  u64 size,
		  unsigned int page_mask)
{
	struct drm_i915_gem_object *obj;

	GEM_BUG_ON(!size);
	GEM_BUG_ON(!IS_ALIGNED(size, BIT(__ffs(page_mask))));

	if (size >> PAGE_SHIFT > INT_MAX)
		return ERR_PTR(-E2BIG);

	if (overflows_type(size, obj->base.size))
		return ERR_PTR(-E2BIG);

	obj = i915_gem_object_alloc(i915);
	if (!obj)
		return ERR_PTR(-ENOMEM);

	drm_gem_private_object_init(&i915->drm, &obj->base, size);
	i915_gem_object_init(obj, &huge_page_ops);

	obj->write_domain = I915_GEM_DOMAIN_CPU;
	obj->read_domains = I915_GEM_DOMAIN_CPU;
	obj->cache_level = I915_CACHE_NONE;

	obj->mm.page_mask = page_mask;

	return obj;
}
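
/*
 * The "fake" flavour below never allocates real memory: each sg entry only
 * carries a length and a dummy dma address (the chosen page size), which is
 * all the mock GTT paths need since the pages are never dereferenced. Note
 * that the GFP mask #defined in get_huge_pages() is deliberately left live
 * for these helpers and only #undef'd at the end of
 * fake_get_huge_pages_single().
 */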
static int fake_get_huge_pages(struct drm_i915_gem_object *obj)
{
	struct drm_i915_private *i915 = to_i915(obj->base.dev);
	const u64 max_len = rounddown_pow_of_two(UINT_MAX);
	struct sg_table *st;
	struct scatterlist *sg;
	unsigned int sg_page_sizes;
	u64 rem;

	st = kmalloc(sizeof(*st), GFP);
	if (!st)
		return -ENOMEM;

	if (sg_alloc_table(st, obj->base.size >> PAGE_SHIFT, GFP)) {
		kfree(st);
		return -ENOMEM;
	}

	/* Use optimal page sized chunks to fill in the sg table */
	rem = obj->base.size;
	sg = st->sgl;
	st->nents = 0;
	sg_page_sizes = 0;
	do {
		unsigned int page_size = get_largest_page_size(i915, rem);
		unsigned int len = min(page_size * div_u64(rem, page_size),
				       max_len);

		GEM_BUG_ON(!page_size);

		sg->offset = 0;
		sg->length = len;
		sg_dma_len(sg) = len;
		sg_dma_address(sg) = page_size;

		sg_page_sizes |= len;

		st->nents++;

		rem -= len;
		if (!rem) {
			sg_mark_end(sg);
			break;
		}

		sg = sg_next(sg);
	} while (1);

	obj->mm.madv = I915_MADV_DONTNEED;

	__i915_gem_object_set_pages(obj, st, sg_page_sizes);

	return 0;
}

static int fake_get_huge_pages_single(struct drm_i915_gem_object *obj)
{
	struct drm_i915_private *i915 = to_i915(obj->base.dev);
	struct sg_table *st;
	struct scatterlist *sg;
	unsigned int page_size;

	st = kmalloc(sizeof(*st), GFP);
	if (!st)
		return -ENOMEM;

	if (sg_alloc_table(st, 1, GFP)) {
		kfree(st);
		return -ENOMEM;
	}

	sg = st->sgl;
	st->nents = 1;

	page_size = get_largest_page_size(i915, obj->base.size);
	GEM_BUG_ON(!page_size);

	sg->offset = 0;
	sg->length = obj->base.size;
	sg_dma_len(sg) = obj->base.size;
	sg_dma_address(sg) = page_size;

	obj->mm.madv = I915_MADV_DONTNEED;

	__i915_gem_object_set_pages(obj, st, sg->length);

	return 0;
#undef GFP
}

static void fake_free_huge_pages(struct drm_i915_gem_object *obj,
				 struct sg_table *pages)
{
	sg_free_table(pages);
	kfree(pages);
}

static void fake_put_huge_pages(struct drm_i915_gem_object *obj,
				struct sg_table *pages)
{
	fake_free_huge_pages(obj, pages);
	obj->mm.dirty = false;
	obj->mm.madv = I915_MADV_WILLNEED;
}

static const struct drm_i915_gem_object_ops fake_ops = {
	.flags = I915_GEM_OBJECT_IS_SHRINKABLE,
	.get_pages = fake_get_huge_pages,
	.put_pages = fake_put_huge_pages,
};

static const struct drm_i915_gem_object_ops fake_ops_single = {
	.flags = I915_GEM_OBJECT_IS_SHRINKABLE,
	.get_pages = fake_get_huge_pages_single,
	.put_pages = fake_put_huge_pages,
};
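
/*
 * The two ops tables above differ only in their backing strategy: fake_ops
 * fills the object with optimally sized chunks, while fake_ops_single backs
 * the whole object with a single sg entry.
 */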
static struct drm_i915_gem_object *
fake_huge_pages_object(struct drm_i915_private *i915, u64 size, bool single)
{
	struct drm_i915_gem_object *obj;

	GEM_BUG_ON(!size);
	GEM_BUG_ON(!IS_ALIGNED(size, I915_GTT_PAGE_SIZE));

	if (size >> PAGE_SHIFT > UINT_MAX)
		return ERR_PTR(-E2BIG);

	if (overflows_type(size, obj->base.size))
		return ERR_PTR(-E2BIG);

	obj = i915_gem_object_alloc(i915);
	if (!obj)
		return ERR_PTR(-ENOMEM);

	drm_gem_private_object_init(&i915->drm, &obj->base, size);

	if (single)
		i915_gem_object_init(obj, &fake_ops_single);
	else
		i915_gem_object_init(obj, &fake_ops);

	obj->write_domain = I915_GEM_DOMAIN_CPU;
	obj->read_domains = I915_GEM_DOMAIN_CPU;
	obj->cache_level = I915_CACHE_NONE;

	return obj;
}
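
/*
 * Common sanity check used by all the tests below: the vma's page-size
 * tracking must be self-consistent with the object's, must only ever name
 * sizes the device claims to support, and obj->mm.page_sizes.gtt must never
 * be set (the gtt size is a property of the binding, not the object).
 */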
static int igt_check_page_sizes(struct i915_vma *vma)
{
	struct drm_i915_private *i915 = to_i915(vma->obj->base.dev);
	unsigned int supported = INTEL_INFO(i915)->page_sizes;
	struct drm_i915_gem_object *obj = vma->obj;
	int err = 0;

	if (!HAS_PAGE_SIZES(i915, vma->page_sizes.sg)) {
		pr_err("unsupported page_sizes.sg=%u, supported=%u\n",
		       vma->page_sizes.sg & ~supported, supported);
		err = -EINVAL;
	}

	if (!HAS_PAGE_SIZES(i915, vma->page_sizes.gtt)) {
		pr_err("unsupported page_sizes.gtt=%u, supported=%u\n",
		       vma->page_sizes.gtt & ~supported, supported);
		err = -EINVAL;
	}

	if (vma->page_sizes.phys != obj->mm.page_sizes.phys) {
		pr_err("vma->page_sizes.phys(%u) != obj->mm.page_sizes.phys(%u)\n",
		       vma->page_sizes.phys, obj->mm.page_sizes.phys);
		err = -EINVAL;
	}

	if (vma->page_sizes.sg != obj->mm.page_sizes.sg) {
		pr_err("vma->page_sizes.sg(%u) != obj->mm.page_sizes.sg(%u)\n",
		       vma->page_sizes.sg, obj->mm.page_sizes.sg);
		err = -EINVAL;
	}

	if (obj->mm.page_sizes.gtt) {
		pr_err("obj->page_sizes.gtt(%u) should never be set\n",
		       obj->mm.page_sizes.gtt);
		err = -EINVAL;
	}

	return err;
}

static int igt_mock_exhaust_device_supported_pages(void *arg)
{
	struct i915_hw_ppgtt *ppgtt = arg;
	struct drm_i915_private *i915 = ppgtt->base.i915;
	unsigned int saved_mask = INTEL_INFO(i915)->page_sizes;
	struct drm_i915_gem_object *obj;
	struct i915_vma *vma;
	int i, j, single;
	int err;

	/*
	 * Sanity check creating objects with every valid page support
	 * combination for our mock device.
	 */

	for (i = 1; i < BIT(ARRAY_SIZE(page_sizes)); i++) {
		unsigned int combination = 0;

		for (j = 0; j < ARRAY_SIZE(page_sizes); j++) {
			if (i & BIT(j))
				combination |= page_sizes[j];
		}

		mkwrite_device_info(i915)->page_sizes = combination;

		for (single = 0; single <= 1; ++single) {
			obj = fake_huge_pages_object(i915, combination,
						     !!single);
			if (IS_ERR(obj)) {
				err = PTR_ERR(obj);
				goto out_device;
			}

			if (obj->base.size != combination) {
				pr_err("obj->base.size=%zu, expected=%u\n",
				       obj->base.size, combination);
				err = -EINVAL;
				goto out_put;
			}

			vma = i915_vma_instance(obj, &ppgtt->base, NULL);
			if (IS_ERR(vma)) {
				err = PTR_ERR(vma);
				goto out_put;
			}

			err = i915_vma_pin(vma, 0, 0, PIN_USER);
			if (err)
				goto out_close;

			err = igt_check_page_sizes(vma);

			if (vma->page_sizes.sg != combination) {
				pr_err("page_sizes.sg=%u, expected=%u\n",
				       vma->page_sizes.sg, combination);
				err = -EINVAL;
			}

			i915_vma_unpin(vma);
			i915_vma_close(vma);

			i915_gem_object_put(obj);

			if (err)
				goto out_device;
		}
	}

	goto out_device;

out_close:
	i915_vma_close(vma);
out_put:
	i915_gem_object_put(obj);
out_device:
	mkwrite_device_info(i915)->page_sizes = saved_mask;

	return err;
}

static int igt_mock_ppgtt_misaligned_dma(void *arg)
{
	struct i915_hw_ppgtt *ppgtt = arg;
	struct drm_i915_private *i915 = ppgtt->base.i915;
	unsigned long supported = INTEL_INFO(i915)->page_sizes;
	struct drm_i915_gem_object *obj;
	int bit;
	int err;

	/*
	 * Sanity check dma misalignment for huge pages -- the dma addresses we
	 * insert into the paging structures need to always respect the page
	 * size alignment.
	 */

	bit = ilog2(I915_GTT_PAGE_SIZE_64K);

	for_each_set_bit_from(bit, &supported,
			      ilog2(I915_GTT_MAX_PAGE_SIZE) + 1) {
		IGT_TIMEOUT(end_time);
		unsigned int page_size = BIT(bit);
		unsigned int flags = PIN_USER | PIN_OFFSET_FIXED;
		unsigned int offset;
		unsigned int size =
			round_up(page_size, I915_GTT_PAGE_SIZE_2M) << 1;
		struct i915_vma *vma;

		obj = fake_huge_pages_object(i915, size, true);
		if (IS_ERR(obj))
			return PTR_ERR(obj);

		if (obj->base.size != size) {
			pr_err("obj->base.size=%zu, expected=%u\n",
			       obj->base.size, size);
			err = -EINVAL;
			goto out_put;
		}

		err = i915_gem_object_pin_pages(obj);
		if (err)
			goto out_put;

		/* Force the page size for this object */
		obj->mm.page_sizes.sg = page_size;

		vma = i915_vma_instance(obj, &ppgtt->base, NULL);
		if (IS_ERR(vma)) {
			err = PTR_ERR(vma);
			goto out_unpin;
		}

		err = i915_vma_pin(vma, 0, 0, flags);
		if (err) {
			i915_vma_close(vma);
			goto out_unpin;
		}

		err = igt_check_page_sizes(vma);

		if (vma->page_sizes.gtt != page_size) {
			pr_err("page_sizes.gtt=%u, expected %u\n",
			       vma->page_sizes.gtt, page_size);
			err = -EINVAL;
		}

		i915_vma_unpin(vma);

		if (err) {
			i915_vma_close(vma);
			goto out_unpin;
		}

		/*
		 * Try all the other valid offsets until the next
		 * boundary -- should always fall back to using 4K
		 * pages.
		 */
		for (offset = 4096; offset < page_size; offset += 4096) {
			err = i915_vma_unbind(vma);
			if (err) {
				i915_vma_close(vma);
				goto out_unpin;
			}

			err = i915_vma_pin(vma, 0, 0, flags | offset);
			if (err) {
				i915_vma_close(vma);
				goto out_unpin;
			}

			err = igt_check_page_sizes(vma);

			if (vma->page_sizes.gtt != I915_GTT_PAGE_SIZE_4K) {
				pr_err("page_sizes.gtt=%u, expected %lu\n",
				       vma->page_sizes.gtt,
				       I915_GTT_PAGE_SIZE_4K);
				err = -EINVAL;
			}

			i915_vma_unpin(vma);

			if (err) {
				i915_vma_close(vma);
				goto out_unpin;
			}

			if (igt_timeout(end_time,
					"%s timed out at offset %x with page-size %x\n",
					__func__, offset, page_size))
				break;
		}

		i915_vma_close(vma);

		i915_gem_object_unpin_pages(obj);
		i915_gem_object_put(obj);
	}

	return 0;

out_unpin:
	i915_gem_object_unpin_pages(obj);
out_put:
	i915_gem_object_put(obj);

	return err;
}
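
/* Tear down a list of pinned test objects, closing any vma we instantiated. */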
static void close_object_list(struct list_head *objects,
			      struct i915_hw_ppgtt *ppgtt)
{
	struct drm_i915_gem_object *obj, *on;

	list_for_each_entry_safe(obj, on, objects, st_link) {
		struct i915_vma *vma;

		vma = i915_vma_instance(obj, &ppgtt->base, NULL);
		if (!IS_ERR(vma))
			i915_vma_close(vma);

		list_del(&obj->st_link);
		i915_gem_object_unpin_pages(obj);
		i915_gem_object_put(obj);
	}
}

static int igt_mock_ppgtt_huge_fill(void *arg)
{
	struct i915_hw_ppgtt *ppgtt = arg;
	struct drm_i915_private *i915 = ppgtt->base.i915;
	unsigned long max_pages = ppgtt->base.total >> PAGE_SHIFT;
	unsigned long page_num;
	bool single = false;
	LIST_HEAD(objects);
	IGT_TIMEOUT(end_time);
	int err = -ENODEV;

	for_each_prime_number_from(page_num, 1, max_pages) {
		struct drm_i915_gem_object *obj;
		u64 size = page_num << PAGE_SHIFT;
		struct i915_vma *vma;
		unsigned int expected_gtt = 0;
		int i;

		obj = fake_huge_pages_object(i915, size, single);
		if (IS_ERR(obj)) {
			err = PTR_ERR(obj);
			break;
		}

		if (obj->base.size != size) {
			pr_err("obj->base.size=%zd, expected=%llu\n",
			       obj->base.size, size);
			i915_gem_object_put(obj);
			err = -EINVAL;
			break;
		}

		err = i915_gem_object_pin_pages(obj);
		if (err) {
			i915_gem_object_put(obj);
			break;
		}

		list_add(&obj->st_link, &objects);

		vma = i915_vma_instance(obj, &ppgtt->base, NULL);
		if (IS_ERR(vma)) {
			err = PTR_ERR(vma);
			break;
		}

		err = i915_vma_pin(vma, 0, 0, PIN_USER);
		if (err)
			break;

		err = igt_check_page_sizes(vma);
		if (err) {
			i915_vma_unpin(vma);
			break;
		}

		/*
		 * Figure out the expected gtt page size knowing that we go from
		 * largest to smallest page size sg chunks, and that we align to
		 * the largest page size.
		 */
		for (i = 0; i < ARRAY_SIZE(page_sizes); ++i) {
			unsigned int page_size = page_sizes[i];

			if (HAS_PAGE_SIZES(i915, page_size) &&
			    size >= page_size) {
				expected_gtt |= page_size;
				size &= page_size-1;
			}
		}

		GEM_BUG_ON(!expected_gtt);
		GEM_BUG_ON(size);

		if (expected_gtt & I915_GTT_PAGE_SIZE_4K)
			expected_gtt &= ~I915_GTT_PAGE_SIZE_64K;

		i915_vma_unpin(vma);

		if (vma->page_sizes.sg & I915_GTT_PAGE_SIZE_64K) {
			if (!IS_ALIGNED(vma->node.start,
					I915_GTT_PAGE_SIZE_2M)) {
				pr_err("node.start(%llx) not aligned to 2M\n",
				       vma->node.start);
				err = -EINVAL;
				break;
			}

			if (!IS_ALIGNED(vma->node.size,
					I915_GTT_PAGE_SIZE_2M)) {
				pr_err("node.size(%llx) not aligned to 2M\n",
				       vma->node.size);
				err = -EINVAL;
				break;
			}
		}

		if (vma->page_sizes.gtt != expected_gtt) {
			pr_err("gtt=%u, expected=%u, size=%zd, single=%s\n",
			       vma->page_sizes.gtt, expected_gtt,
			       obj->base.size, yesno(!!single));
			err = -EINVAL;
			break;
		}

		if (igt_timeout(end_time,
				"%s timed out at size %zd\n",
				__func__, obj->base.size))
			break;

		single = !single;
	}

	close_object_list(&objects, ppgtt);

	if (err == -ENOMEM || err == -ENOSPC)
		err = 0;

	return err;
}
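
/*
 * The object_info table below pairs object sizes and pin offsets with the
 * GTT page size(s) we expect the 64K insertion rules to select for them.
 */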
static int igt_mock_ppgtt_64K(void *arg)
{
	struct i915_hw_ppgtt *ppgtt = arg;
	struct drm_i915_private *i915 = ppgtt->base.i915;
	struct drm_i915_gem_object *obj;
	const struct object_info {
		unsigned int size;
		unsigned int gtt;
		unsigned int offset;
	} objects[] = {
		/* Cases with forced padding/alignment */
		{
			.size = SZ_64K,
			.gtt = I915_GTT_PAGE_SIZE_64K,
			.offset = 0,
		},
		{
			.size = SZ_64K + SZ_4K,
			.gtt = I915_GTT_PAGE_SIZE_4K,
			.offset = 0,
		},
		{
			.size = SZ_64K - SZ_4K,
			.gtt = I915_GTT_PAGE_SIZE_4K,
			.offset = 0,
		},
		{
			.size = SZ_2M,
			.gtt = I915_GTT_PAGE_SIZE_64K,
			.offset = 0,
		},
		{
			.size = SZ_2M - SZ_4K,
			.gtt = I915_GTT_PAGE_SIZE_4K,
			.offset = 0,
		},
		{
			.size = SZ_2M + SZ_4K,
			.gtt = I915_GTT_PAGE_SIZE_64K | I915_GTT_PAGE_SIZE_4K,
			.offset = 0,
		},
		{
			.size = SZ_2M + SZ_64K,
			.gtt = I915_GTT_PAGE_SIZE_64K,
			.offset = 0,
		},
		{
			.size = SZ_2M - SZ_64K,
			.gtt = I915_GTT_PAGE_SIZE_64K,
			.offset = 0,
		},
		/* Try without any forced padding/alignment */
		{
			.size = SZ_64K,
			.offset = SZ_2M,
			.gtt = I915_GTT_PAGE_SIZE_4K,
		},
		{
			.size = SZ_128K,
			.offset = SZ_2M - SZ_64K,
			.gtt = I915_GTT_PAGE_SIZE_4K,
		},
	};
	struct i915_vma *vma;
	int i, single;
	int err;

	/*
	 * Sanity check some of the trickiness with 64K pages -- either we can
	 * safely mark the whole page-table (2M block) as 64K, or we have to
	 * always fall back to 4K.
	 */

	if (!HAS_PAGE_SIZES(i915, I915_GTT_PAGE_SIZE_64K))
		return 0;

	for (i = 0; i < ARRAY_SIZE(objects); ++i) {
		unsigned int size = objects[i].size;
		unsigned int expected_gtt = objects[i].gtt;
		unsigned int offset = objects[i].offset;
		unsigned int flags = PIN_USER;

		for (single = 0; single <= 1; single++) {
			obj = fake_huge_pages_object(i915, size, !!single);
			if (IS_ERR(obj))
				return PTR_ERR(obj);

			err = i915_gem_object_pin_pages(obj);
			if (err)
				goto out_object_put;

			/*
			 * Disable 2M pages -- We only want to use 64K/4K pages
			 * for this test.
			 */
			obj->mm.page_sizes.sg &= ~I915_GTT_PAGE_SIZE_2M;

			vma = i915_vma_instance(obj, &ppgtt->base, NULL);
			if (IS_ERR(vma)) {
				err = PTR_ERR(vma);
				goto out_object_unpin;
			}

			if (offset)
				flags |= PIN_OFFSET_FIXED | offset;

			err = i915_vma_pin(vma, 0, 0, flags);
			if (err)
				goto out_vma_close;

			err = igt_check_page_sizes(vma);
			if (err)
				goto out_vma_unpin;

			if (!offset && vma->page_sizes.sg & I915_GTT_PAGE_SIZE_64K) {
				if (!IS_ALIGNED(vma->node.start,
						I915_GTT_PAGE_SIZE_2M)) {
					pr_err("node.start(%llx) not aligned to 2M\n",
					       vma->node.start);
					err = -EINVAL;
					goto out_vma_unpin;
				}

				if (!IS_ALIGNED(vma->node.size,
						I915_GTT_PAGE_SIZE_2M)) {
					pr_err("node.size(%llx) not aligned to 2M\n",
					       vma->node.size);
					err = -EINVAL;
					goto out_vma_unpin;
				}
			}

			if (vma->page_sizes.gtt != expected_gtt) {
				pr_err("gtt=%u, expected=%u, i=%d, single=%s\n",
				       vma->page_sizes.gtt, expected_gtt, i,
				       yesno(!!single));
				err = -EINVAL;
				goto out_vma_unpin;
			}

			i915_vma_unpin(vma);
			i915_vma_close(vma);

			i915_gem_object_unpin_pages(obj);
			i915_gem_object_put(obj);
		}
	}

	return 0;

out_vma_unpin:
	i915_vma_unpin(vma);
out_vma_close:
	i915_vma_close(vma);
out_object_unpin:
	i915_gem_object_unpin_pages(obj);
out_object_put:
	i915_gem_object_put(obj);

	return err;
}
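
/*
 * Build a batch buffer which emits one MI_STORE_DWORD_IMM per page of @vma,
 * writing @val to the same dword slot (@offset within the page) of every
 * page, using the store-dword encoding appropriate for the gen.
 */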
static struct i915_vma *
gpu_write_dw(struct i915_vma *vma, u64 offset, u32 val)
{
	struct drm_i915_private *i915 = to_i915(vma->obj->base.dev);
	const int gen = INTEL_GEN(vma->vm->i915);
	unsigned int count = vma->size >> PAGE_SHIFT;
	struct drm_i915_gem_object *obj;
	struct i915_vma *batch;
	unsigned int size;
	u32 *cmd;
	int n;
	int err;

	size = (1 + 4 * count) * sizeof(u32);
	size = round_up(size, PAGE_SIZE);
	obj = i915_gem_object_create_internal(i915, size);
	if (IS_ERR(obj))
		return ERR_CAST(obj);

	cmd = i915_gem_object_pin_map(obj, I915_MAP_WB);
	if (IS_ERR(cmd)) {
		err = PTR_ERR(cmd);
		goto err;
	}

	offset += vma->node.start;

	for (n = 0; n < count; n++) {
		if (gen >= 8) {
			*cmd++ = MI_STORE_DWORD_IMM_GEN4;
			*cmd++ = lower_32_bits(offset);
			*cmd++ = upper_32_bits(offset);
			*cmd++ = val;
		} else if (gen >= 4) {
			*cmd++ = MI_STORE_DWORD_IMM_GEN4 |
				(gen < 6 ? 1 << 22 : 0);
			*cmd++ = 0;
			*cmd++ = offset;
			*cmd++ = val;
		} else {
			*cmd++ = MI_STORE_DWORD_IMM | 1 << 22;
			*cmd++ = offset;
			*cmd++ = val;
		}

		offset += PAGE_SIZE;
	}

	*cmd = MI_BATCH_BUFFER_END;

	i915_gem_object_unpin_map(obj);

	err = i915_gem_object_set_to_gtt_domain(obj, false);
	if (err)
		goto err;

	batch = i915_vma_instance(obj, vma->vm, NULL);
	if (IS_ERR(batch)) {
		err = PTR_ERR(batch);
		goto err;
	}

	err = i915_vma_pin(batch, 0, 0, PIN_USER);
	if (err)
		goto err;

	return batch;

err:
	i915_gem_object_put(obj);

	return ERR_PTR(err);
}

static int gpu_write(struct i915_vma *vma,
		     struct i915_gem_context *ctx,
		     struct intel_engine_cs *engine,
		     u32 dword,
		     u32 value)
{
	struct i915_request *rq;
	struct i915_vma *batch;
	int flags = 0;
	int err;

	GEM_BUG_ON(!intel_engine_can_store_dword(engine));

	err = i915_gem_object_set_to_gtt_domain(vma->obj, true);
	if (err)
		return err;

	rq = i915_request_alloc(engine, ctx);
	if (IS_ERR(rq))
		return PTR_ERR(rq);

	batch = gpu_write_dw(vma, dword * sizeof(u32), value);
	if (IS_ERR(batch)) {
		err = PTR_ERR(batch);
		goto err_request;
	}

	i915_vma_move_to_active(batch, rq, 0);
	i915_gem_object_set_active_reference(batch->obj);
	i915_vma_unpin(batch);
	i915_vma_close(batch);

	err = engine->emit_bb_start(rq,
				    batch->node.start, batch->node.size,
				    flags);
	if (err)
		goto err_request;

	i915_vma_move_to_active(vma, rq, EXEC_OBJECT_WRITE);

	reservation_object_lock(vma->resv, NULL);
	reservation_object_add_excl_fence(vma->resv, &rq->fence);
	reservation_object_unlock(vma->resv);

err_request:
	__i915_request_add(rq, err == 0);

	return err;
}
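
/*
 * CPU-side readback: verify that the chosen dword of every page holds @val,
 * flushing stale cachelines first where the domain tracking requires it.
 */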
static int cpu_check(struct drm_i915_gem_object *obj, u32 dword, u32 val)
{
	unsigned int needs_flush;
	unsigned long n;
	int err;

	err = i915_gem_obj_prepare_shmem_read(obj, &needs_flush);
	if (err)
		return err;

	for (n = 0; n < obj->base.size >> PAGE_SHIFT; ++n) {
		u32 *ptr = kmap_atomic(i915_gem_object_get_page(obj, n));

		if (needs_flush & CLFLUSH_BEFORE)
			drm_clflush_virt_range(ptr, PAGE_SIZE);

		if (ptr[dword] != val) {
			pr_err("n=%lu ptr[%u]=%u, val=%u\n",
			       n, dword, ptr[dword], val);
			kunmap_atomic(ptr);
			err = -EINVAL;
			break;
		}

		kunmap_atomic(ptr);
	}

	i915_gem_obj_finish_shmem_access(obj);

	return err;
}
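
/*
 * Pin @obj at the fixed @offset, write @val to the given dword slot from the
 * GPU, then read it back on the CPU to confirm the write landed where we
 * expected.
 */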
static int __igt_write_huge(struct i915_gem_context *ctx,
			    struct intel_engine_cs *engine,
			    struct drm_i915_gem_object *obj,
			    u64 size, u64 offset,
			    u32 dword, u32 val)
{
	struct drm_i915_private *i915 = to_i915(obj->base.dev);
	struct i915_address_space *vm = ctx->ppgtt ? &ctx->ppgtt->base : &i915->ggtt.base;
	unsigned int flags = PIN_USER | PIN_OFFSET_FIXED;
	struct i915_vma *vma;
	int err;

	vma = i915_vma_instance(obj, vm, NULL);
	if (IS_ERR(vma))
		return PTR_ERR(vma);

	err = i915_vma_unbind(vma);
	if (err)
		goto out_vma_close;

	err = i915_vma_pin(vma, size, 0, flags | offset);
	if (err) {
		/*
		 * The ggtt may have some pages reserved so
		 * refrain from erroring out.
		 */
		if (err == -ENOSPC && i915_is_ggtt(vm))
			err = 0;

		goto out_vma_close;
	}

	err = igt_check_page_sizes(vma);
	if (err)
		goto out_vma_unpin;

	err = gpu_write(vma, ctx, engine, dword, val);
	if (err) {
		pr_err("gpu-write failed at offset=%llx\n", offset);
		goto out_vma_unpin;
	}

	err = cpu_check(obj, dword, val);
	if (err) {
		pr_err("cpu-check failed at offset=%llx\n", offset);
		goto out_vma_unpin;
	}

out_vma_unpin:
	i915_vma_unpin(vma);
out_vma_close:
	i915_vma_destroy(vma);

	return err;
}

static int igt_write_huge(struct i915_gem_context *ctx,
			  struct drm_i915_gem_object *obj)
{
	struct drm_i915_private *i915 = to_i915(obj->base.dev);
	struct i915_address_space *vm = ctx->ppgtt ? &ctx->ppgtt->base : &i915->ggtt.base;
	static struct intel_engine_cs *engines[I915_NUM_ENGINES];
	struct intel_engine_cs *engine;
	I915_RND_STATE(prng);
	IGT_TIMEOUT(end_time);
	unsigned int max_page_size;
	unsigned int id;
	u64 max;
	u64 num;
	u64 size;
	int *order;
	int i, n;
	int err = 0;

	GEM_BUG_ON(!i915_gem_object_has_pinned_pages(obj));

	size = obj->base.size;
	if (obj->mm.page_sizes.sg & I915_GTT_PAGE_SIZE_64K)
		size = round_up(size, I915_GTT_PAGE_SIZE_2M);

	max_page_size = rounddown_pow_of_two(obj->mm.page_sizes.sg);
	max = div_u64((vm->total - size), max_page_size);

	n = 0;
	for_each_engine(engine, i915, id) {
		if (!intel_engine_can_store_dword(engine)) {
			pr_info("store-dword-imm not supported on engine=%u\n",
				id);
			continue;
		}
		engines[n++] = engine;
	}

	if (!n)
		return 0;

	/*
	 * To keep things interesting when alternating between engines in our
	 * randomized order, let's also make feeding the same engine a few
	 * times in succession a possibility by enlarging the permutation
	 * array.
	 */
	order = i915_random_order(n * I915_NUM_ENGINES, &prng);
	if (!order)
		return -ENOMEM;

	/*
	 * Try various offsets in an ascending/descending fashion until we
	 * time out -- we want to avoid issues hidden by effectively always
	 * using offset = 0.
	 */
	i = 0;
	for_each_prime_number_from(num, 0, max) {
		u64 offset_low = num * max_page_size;
		u64 offset_high = (max - num) * max_page_size;
		u32 dword = offset_in_page(num) / 4;

		engine = engines[order[i] % n];
		i = (i + 1) % (n * I915_NUM_ENGINES);

		err = __igt_write_huge(ctx, engine, obj, size, offset_low,
				       dword, num + 1);
		if (err)
			break;

		err = __igt_write_huge(ctx, engine, obj, size, offset_high,
				       dword, num + 1);
		if (err)
			break;

		if (igt_timeout(end_time,
				"%s timed out on engine=%u, offset_low=%llx offset_high=%llx, max_page_size=%x\n",
				__func__, engine->id, offset_low, offset_high,
				max_page_size))
			break;
	}

	kfree(order);

	return err;
}

static int igt_ppgtt_exhaust_huge(void *arg)
{
	struct i915_gem_context *ctx = arg;
	struct drm_i915_private *i915 = ctx->i915;
	unsigned long supported = INTEL_INFO(i915)->page_sizes;
	static unsigned int pages[ARRAY_SIZE(page_sizes)];
	struct drm_i915_gem_object *obj;
	unsigned int size_mask;
	unsigned int page_mask;
	int n, i;
	int err = -ENODEV;

	if (supported == I915_GTT_PAGE_SIZE_4K)
		return 0;

	/*
	 * Sanity check creating objects with a varying mix of page sizes --
	 * ensuring that our writes land in the right place.
	 */

	n = 0;
	for_each_set_bit(i, &supported, ilog2(I915_GTT_MAX_PAGE_SIZE) + 1)
		pages[n++] = BIT(i);

	for (size_mask = 2; size_mask < BIT(n); size_mask++) {
		unsigned int size = 0;

		for (i = 0; i < n; i++) {
			if (size_mask & BIT(i))
				size |= pages[i];
		}

		/*
		 * For our page mask we want to enumerate all the page-size
		 * combinations which will fit into our chosen object size.
		 */
		for (page_mask = 2; page_mask <= size_mask; page_mask++) {
			unsigned int page_sizes = 0;

			for (i = 0; i < n; i++) {
				if (page_mask & BIT(i))
					page_sizes |= pages[i];
			}

			/*
			 * Ensure that we can actually fill the given object
			 * with our chosen page mask.
			 */
			if (!IS_ALIGNED(size, BIT(__ffs(page_sizes))))
				continue;

			obj = huge_pages_object(i915, size, page_sizes);
			if (IS_ERR(obj)) {
				err = PTR_ERR(obj);
				goto out_device;
			}

			err = i915_gem_object_pin_pages(obj);
			if (err) {
				i915_gem_object_put(obj);

				if (err == -ENOMEM) {
					pr_info("unable to get pages, size=%u, pages=%u\n",
						size, page_sizes);
					err = 0;
					break;
				}

				pr_err("pin_pages failed, size=%u, pages=%u\n",
				       size_mask, page_mask);

				goto out_device;
			}

			/* Force the page-size for the gtt insertion */
			obj->mm.page_sizes.sg = page_sizes;

			err = igt_write_huge(ctx, obj);
			if (err) {
				pr_err("exhaust write-huge failed with size=%u\n",
				       size);
				goto out_unpin;
			}

			i915_gem_object_unpin_pages(obj);
			i915_gem_object_put(obj);
		}
	}

	goto out_device;

out_unpin:
	i915_gem_object_unpin_pages(obj);
	i915_gem_object_put(obj);
out_device:
	mkwrite_device_info(i915)->page_sizes = supported;

	return err;
}

static int igt_ppgtt_internal_huge(void *arg)
{
	struct i915_gem_context *ctx = arg;
	struct drm_i915_private *i915 = ctx->i915;
	struct drm_i915_gem_object *obj;
	static const unsigned int sizes[] = {
		SZ_64K,
		SZ_128K,
		SZ_256K,
		SZ_512K,
		SZ_1M,
		SZ_2M,
	};
	int i;
	int err;

	/*
	 * Sanity check that the HW uses huge pages correctly through the
	 * internal backend -- ensure that our writes land in the right place.
	 */

	for (i = 0; i < ARRAY_SIZE(sizes); ++i) {
		unsigned int size = sizes[i];

		obj = i915_gem_object_create_internal(i915, size);
		if (IS_ERR(obj))
			return PTR_ERR(obj);

		err = i915_gem_object_pin_pages(obj);
		if (err)
			goto out_put;

		if (obj->mm.page_sizes.phys < I915_GTT_PAGE_SIZE_64K) {
			pr_info("internal unable to allocate huge-page(s) with size=%u\n",
				size);
			goto out_unpin;
		}

		err = igt_write_huge(ctx, obj);
		if (err) {
			pr_err("internal write-huge failed with size=%u\n",
			       size);
			goto out_unpin;
		}

		i915_gem_object_unpin_pages(obj);
		i915_gem_object_put(obj);
	}

	return 0;

out_unpin:
	i915_gem_object_unpin_pages(obj);
out_put:
	i915_gem_object_put(obj);

	return err;
}

static inline bool igt_can_allocate_thp(struct drm_i915_private *i915)
{
	return i915->mm.gemfs && has_transparent_hugepage();
}

static int igt_ppgtt_gemfs_huge(void *arg)
{
	struct i915_gem_context *ctx = arg;
	struct drm_i915_private *i915 = ctx->i915;
	struct drm_i915_gem_object *obj;
	static const unsigned int sizes[] = {
		SZ_2M,
		SZ_4M,
		SZ_8M,
		SZ_16M,
		SZ_32M,
	};
	int i;
	int err;

	/*
	 * Sanity check that the HW uses huge pages correctly through gemfs --
	 * ensure that our writes land in the right place.
	 */

	if (!igt_can_allocate_thp(i915)) {
		pr_info("missing THP support, skipping\n");
		return 0;
	}

	for (i = 0; i < ARRAY_SIZE(sizes); ++i) {
		unsigned int size = sizes[i];

		obj = i915_gem_object_create(i915, size);
		if (IS_ERR(obj))
			return PTR_ERR(obj);

		err = i915_gem_object_pin_pages(obj);
		if (err)
			goto out_put;

		if (obj->mm.page_sizes.phys < I915_GTT_PAGE_SIZE_2M) {
			pr_info("finishing test early, gemfs unable to allocate huge-page(s) with size=%u\n",
				size);
			goto out_unpin;
		}

		err = igt_write_huge(ctx, obj);
		if (err) {
			pr_err("gemfs write-huge failed with size=%u\n",
			       size);
			goto out_unpin;
		}

		i915_gem_object_unpin_pages(obj);
		i915_gem_object_put(obj);
	}

	return 0;

out_unpin:
	i915_gem_object_unpin_pages(obj);
out_put:
	i915_gem_object_put(obj);

	return err;
}

static int igt_ppgtt_pin_update(void *arg)
{
	struct i915_gem_context *ctx = arg;
	struct drm_i915_private *dev_priv = ctx->i915;
	unsigned long supported = INTEL_INFO(dev_priv)->page_sizes;
	struct i915_hw_ppgtt *ppgtt = ctx->ppgtt;
	struct drm_i915_gem_object *obj;
	struct i915_vma *vma;
	unsigned int flags = PIN_USER | PIN_OFFSET_FIXED;
	int first, last;
	int err;

	/*
	 * Make sure there's no funny business when doing a PIN_UPDATE -- in
	 * the past we had a subtle issue with being able to incorrectly do
	 * multiple alloc va ranges on the same object when doing a
	 * PIN_UPDATE, which resulted in some pretty nasty bugs, though only
	 * when using huge-gtt-pages.
	 */

	if (!USES_FULL_48BIT_PPGTT(dev_priv)) {
		pr_info("48b PPGTT not supported, skipping\n");
		return 0;
	}

	first = ilog2(I915_GTT_PAGE_SIZE_64K);
	last = ilog2(I915_GTT_PAGE_SIZE_2M);

	for_each_set_bit_from(first, &supported, last + 1) {
		unsigned int page_size = BIT(first);

		obj = i915_gem_object_create_internal(dev_priv, page_size);
		if (IS_ERR(obj))
			return PTR_ERR(obj);

		vma = i915_vma_instance(obj, &ppgtt->base, NULL);
		if (IS_ERR(vma)) {
			err = PTR_ERR(vma);
			goto out_put;
		}

		err = i915_vma_pin(vma, SZ_2M, 0, flags);
		if (err)
			goto out_close;

		if (vma->page_sizes.sg < page_size) {
			pr_info("Unable to allocate page-size %x, finishing test early\n",
				page_size);
			goto out_unpin;
		}

		err = igt_check_page_sizes(vma);
		if (err)
			goto out_unpin;

		if (vma->page_sizes.gtt != page_size) {
			dma_addr_t addr = i915_gem_object_get_dma_address(obj, 0);

			/*
			 * The only valid reason for this to ever fail would be
			 * if the dma-mapper screwed us over when we did the
			 * dma_map_sg(), since it has the final say over the
			 * dma address.
			 */
			if (IS_ALIGNED(addr, page_size)) {
				pr_err("page_sizes.gtt=%u, expected=%u\n",
				       vma->page_sizes.gtt, page_size);
				err = -EINVAL;
			} else {
				pr_info("dma address misaligned, finishing test early\n");
			}

			goto out_unpin;
		}

		err = i915_vma_bind(vma, I915_CACHE_NONE, PIN_UPDATE);
		if (err)
			goto out_unpin;

		i915_vma_unpin(vma);
		i915_vma_close(vma);

		i915_gem_object_put(obj);
	}

	obj = i915_gem_object_create_internal(dev_priv, PAGE_SIZE);
	if (IS_ERR(obj))
		return PTR_ERR(obj);

	vma = i915_vma_instance(obj, &ppgtt->base, NULL);
	if (IS_ERR(vma)) {
		err = PTR_ERR(vma);
		goto out_put;
	}

	err = i915_vma_pin(vma, 0, 0, flags);
	if (err)
		goto out_close;

	/*
	 * Make sure we don't end up with something like where the pde is still
	 * pointing to the 2M page, and the pt we just filled-in is dangling --
	 * we can check this by writing to the first page where it would then
	 * land in the now stale 2M page.
	 */

	err = gpu_write(vma, ctx, dev_priv->engine[RCS], 0, 0xdeadbeaf);
	if (err)
		goto out_unpin;

	err = cpu_check(obj, 0, 0xdeadbeaf);

out_unpin:
	i915_vma_unpin(vma);
out_close:
	i915_vma_close(vma);
out_put:
	i915_gem_object_put(obj);

	return err;
}

static int igt_tmpfs_fallback(void *arg)
{
	struct i915_gem_context *ctx = arg;
	struct drm_i915_private *i915 = ctx->i915;
	struct vfsmount *gemfs = i915->mm.gemfs;
	struct i915_address_space *vm = ctx->ppgtt ? &ctx->ppgtt->base : &i915->ggtt.base;
	struct drm_i915_gem_object *obj;
	struct i915_vma *vma;
	u32 *vaddr;
	int err = 0;

	/*
	 * Make sure that we don't burst into a ball of flames upon falling
	 * back to tmpfs, which we rely on if on the off-chance we encounter a
	 * failure when setting up gemfs.
	 */

	i915->mm.gemfs = NULL;

	obj = i915_gem_object_create(i915, PAGE_SIZE);
	if (IS_ERR(obj)) {
		err = PTR_ERR(obj);
		goto out_restore;
	}

	vaddr = i915_gem_object_pin_map(obj, I915_MAP_WB);
	if (IS_ERR(vaddr)) {
		err = PTR_ERR(vaddr);
		goto out_put;
	}
	*vaddr = 0xdeadbeaf;

	i915_gem_object_unpin_map(obj);

	vma = i915_vma_instance(obj, vm, NULL);
	if (IS_ERR(vma)) {
		err = PTR_ERR(vma);
		goto out_put;
	}

	err = i915_vma_pin(vma, 0, 0, PIN_USER);
	if (err)
		goto out_close;

	err = igt_check_page_sizes(vma);

	i915_vma_unpin(vma);
out_close:
	i915_vma_close(vma);
out_put:
	i915_gem_object_put(obj);
out_restore:
	i915->mm.gemfs = gemfs;

	return err;
}

static int igt_shrink_thp(void *arg)
{
	struct i915_gem_context *ctx = arg;
	struct drm_i915_private *i915 = ctx->i915;
	struct i915_address_space *vm = ctx->ppgtt ? &ctx->ppgtt->base : &i915->ggtt.base;
	struct drm_i915_gem_object *obj;
	struct i915_vma *vma;
	unsigned int flags = PIN_USER;
	int err;

	/*
	 * Sanity check shrinking huge-paged object -- make sure nothing blows
	 * up.
	 */

	if (!igt_can_allocate_thp(i915)) {
		pr_info("missing THP support, skipping\n");
		return 0;
	}

	obj = i915_gem_object_create(i915, SZ_2M);
	if (IS_ERR(obj))
		return PTR_ERR(obj);

	vma = i915_vma_instance(obj, vm, NULL);
	if (IS_ERR(vma)) {
		err = PTR_ERR(vma);
		goto out_put;
	}

	err = i915_vma_pin(vma, 0, 0, flags);
	if (err)
		goto out_close;

	if (obj->mm.page_sizes.phys < I915_GTT_PAGE_SIZE_2M) {
		pr_info("failed to allocate THP, finishing test early\n");
		goto out_unpin;
	}

	err = igt_check_page_sizes(vma);
	if (err)
		goto out_unpin;

	err = gpu_write(vma, ctx, i915->engine[RCS], 0, 0xdeadbeaf);
	if (err)
		goto out_unpin;

	i915_vma_unpin(vma);

	/*
	 * Now that the pages are *unpinned* shrink-all should invoke
	 * shmem to truncate our pages.
	 */
	i915_gem_shrink_all(i915);
	if (i915_gem_object_has_pages(obj)) {
		pr_err("shrink-all didn't truncate the pages\n");
		err = -EINVAL;
		goto out_close;
	}

	if (obj->mm.page_sizes.sg || obj->mm.page_sizes.phys) {
		pr_err("residual page-size bits left\n");
		err = -EINVAL;
		goto out_close;
	}

	err = i915_vma_pin(vma, 0, 0, flags);
	if (err)
		goto out_close;

	err = cpu_check(obj, 0, 0xdeadbeaf);

out_unpin:
	i915_vma_unpin(vma);
out_close:
	i915_vma_close(vma);
out_put:
	i915_gem_object_put(obj);

	return err;
}
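
/*
 * Entry points: the mock selftests below run against a fake device and so
 * need no hardware, while the live selftests exercise the real GPU.
 */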
int i915_gem_huge_page_mock_selftests(void)
{
	static const struct i915_subtest tests[] = {
		SUBTEST(igt_mock_exhaust_device_supported_pages),
		SUBTEST(igt_mock_ppgtt_misaligned_dma),
		SUBTEST(igt_mock_ppgtt_huge_fill),
		SUBTEST(igt_mock_ppgtt_64K),
	};
	int saved_ppgtt = i915_modparams.enable_ppgtt;
	struct drm_i915_private *dev_priv;
	struct pci_dev *pdev;
	struct i915_hw_ppgtt *ppgtt;
	int err;

	dev_priv = mock_gem_device();
	if (!dev_priv)
		return -ENOMEM;

	/* Pretend to be a device which supports the 48b PPGTT */
	i915_modparams.enable_ppgtt = 3;

	pdev = dev_priv->drm.pdev;
	dma_coerce_mask_and_coherent(&pdev->dev, DMA_BIT_MASK(39));

	mutex_lock(&dev_priv->drm.struct_mutex);
	ppgtt = i915_ppgtt_create(dev_priv, ERR_PTR(-ENODEV), "mock");
	if (IS_ERR(ppgtt)) {
		err = PTR_ERR(ppgtt);
		goto out_unlock;
	}

	if (!i915_vm_is_48bit(&ppgtt->base)) {
		pr_err("failed to create 48b PPGTT\n");
		err = -EINVAL;
		goto out_close;
	}

	/* If we ever hit this then it's time to mock the 64K scratch */
	if (!i915_vm_has_scratch_64K(&ppgtt->base)) {
		pr_err("PPGTT missing 64K scratch page\n");
		err = -EINVAL;
		goto out_close;
	}

	err = i915_subtests(tests, ppgtt);

out_close:
	i915_ppgtt_close(&ppgtt->base);
	i915_ppgtt_put(ppgtt);

out_unlock:
	mutex_unlock(&dev_priv->drm.struct_mutex);

	i915_modparams.enable_ppgtt = saved_ppgtt;

	drm_dev_unref(&dev_priv->drm);

	return err;
}

int i915_gem_huge_page_live_selftests(struct drm_i915_private *dev_priv)
{
	static const struct i915_subtest tests[] = {
		SUBTEST(igt_shrink_thp),
		SUBTEST(igt_ppgtt_pin_update),
		SUBTEST(igt_tmpfs_fallback),
		SUBTEST(igt_ppgtt_exhaust_huge),
		SUBTEST(igt_ppgtt_gemfs_huge),
		SUBTEST(igt_ppgtt_internal_huge),
	};
	struct drm_file *file;
	struct i915_gem_context *ctx;
	int err;

	if (!USES_PPGTT(dev_priv)) {
		pr_info("PPGTT not supported, skipping live-selftests\n");
		return 0;
	}

	file = mock_file(dev_priv);
	if (IS_ERR(file))
		return PTR_ERR(file);

	mutex_lock(&dev_priv->drm.struct_mutex);
	intel_runtime_pm_get(dev_priv);

	ctx = live_context(dev_priv, file);
	if (IS_ERR(ctx)) {
		err = PTR_ERR(ctx);
		goto out_unlock;
	}

	if (ctx->ppgtt)
		ctx->ppgtt->base.scrub_64K = true;

	err = i915_subtests(tests, ctx);

out_unlock:
	intel_runtime_pm_put(dev_priv);
	mutex_unlock(&dev_priv->drm.struct_mutex);

	mock_file_free(dev_priv, file);

	return err;
}
  1426. }