io-pgtable-arm.c 31 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190
  1. /*
  2. * CPU-agnostic ARM page table allocator.
  3. *
  4. * This program is free software; you can redistribute it and/or modify
  5. * it under the terms of the GNU General Public License version 2 as
  6. * published by the Free Software Foundation.
  7. *
  8. * This program is distributed in the hope that it will be useful,
  9. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. * GNU General Public License for more details.
  12. *
  13. * You should have received a copy of the GNU General Public License
  14. * along with this program. If not, see <http://www.gnu.org/licenses/>.
  15. *
  16. * Copyright (C) 2014 ARM Limited
  17. *
  18. * Author: Will Deacon <will.deacon@arm.com>
  19. */
  20. #define pr_fmt(fmt) "arm-lpae io-pgtable: " fmt
  21. #include <linux/atomic.h>
  22. #include <linux/bitops.h>
  23. #include <linux/iommu.h>
  24. #include <linux/kernel.h>
  25. #include <linux/sizes.h>
  26. #include <linux/slab.h>
  27. #include <linux/types.h>
  28. #include <linux/dma-mapping.h>
  29. #include <asm/barrier.h>
  30. #include "io-pgtable.h"
  31. #define ARM_LPAE_MAX_ADDR_BITS 52
  32. #define ARM_LPAE_S2_MAX_CONCAT_PAGES 16
  33. #define ARM_LPAE_MAX_LEVELS 4
  34. /* Struct accessors */
  35. #define io_pgtable_to_data(x) \
  36. container_of((x), struct arm_lpae_io_pgtable, iop)
  37. #define io_pgtable_ops_to_data(x) \
  38. io_pgtable_to_data(io_pgtable_ops_to_pgtable(x))
  39. /*
  40. * For consistency with the architecture, we always consider
  41. * ARM_LPAE_MAX_LEVELS levels, with the walk starting at level n >=0
  42. */
  43. #define ARM_LPAE_START_LVL(d) (ARM_LPAE_MAX_LEVELS - (d)->levels)
  44. /*
  45. * Calculate the right shift amount to get to the portion describing level l
  46. * in a virtual address mapped by the pagetable in d.
  47. */
  48. #define ARM_LPAE_LVL_SHIFT(l,d) \
  49. ((((d)->levels - ((l) - ARM_LPAE_START_LVL(d) + 1)) \
  50. * (d)->bits_per_level) + (d)->pg_shift)
  51. #define ARM_LPAE_GRANULE(d) (1UL << (d)->pg_shift)
  52. #define ARM_LPAE_PAGES_PER_PGD(d) \
  53. DIV_ROUND_UP((d)->pgd_size, ARM_LPAE_GRANULE(d))
  54. /*
  55. * Calculate the index at level l used to map virtual address a using the
  56. * pagetable in d.
  57. */
  58. #define ARM_LPAE_PGD_IDX(l,d) \
  59. ((l) == ARM_LPAE_START_LVL(d) ? ilog2(ARM_LPAE_PAGES_PER_PGD(d)) : 0)
  60. #define ARM_LPAE_LVL_IDX(a,l,d) \
  61. (((u64)(a) >> ARM_LPAE_LVL_SHIFT(l,d)) & \
  62. ((1 << ((d)->bits_per_level + ARM_LPAE_PGD_IDX(l,d))) - 1))
  63. /* Calculate the block/page mapping size at level l for pagetable in d. */
  64. #define ARM_LPAE_BLOCK_SIZE(l,d) \
  65. (1ULL << (ilog2(sizeof(arm_lpae_iopte)) + \
  66. ((ARM_LPAE_MAX_LEVELS - (l)) * (d)->bits_per_level)))
  67. /* Page table bits */
  68. #define ARM_LPAE_PTE_TYPE_SHIFT 0
  69. #define ARM_LPAE_PTE_TYPE_MASK 0x3
  70. #define ARM_LPAE_PTE_TYPE_BLOCK 1
  71. #define ARM_LPAE_PTE_TYPE_TABLE 3
  72. #define ARM_LPAE_PTE_TYPE_PAGE 3
  73. #define ARM_LPAE_PTE_ADDR_MASK GENMASK_ULL(47,12)
  74. #define ARM_LPAE_PTE_NSTABLE (((arm_lpae_iopte)1) << 63)
  75. #define ARM_LPAE_PTE_XN (((arm_lpae_iopte)3) << 53)
  76. #define ARM_LPAE_PTE_AF (((arm_lpae_iopte)1) << 10)
  77. #define ARM_LPAE_PTE_SH_NS (((arm_lpae_iopte)0) << 8)
  78. #define ARM_LPAE_PTE_SH_OS (((arm_lpae_iopte)2) << 8)
  79. #define ARM_LPAE_PTE_SH_IS (((arm_lpae_iopte)3) << 8)
  80. #define ARM_LPAE_PTE_NS (((arm_lpae_iopte)1) << 5)
  81. #define ARM_LPAE_PTE_VALID (((arm_lpae_iopte)1) << 0)
  82. #define ARM_LPAE_PTE_ATTR_LO_MASK (((arm_lpae_iopte)0x3ff) << 2)
  83. /* Ignore the contiguous bit for block splitting */
  84. #define ARM_LPAE_PTE_ATTR_HI_MASK (((arm_lpae_iopte)6) << 52)
  85. #define ARM_LPAE_PTE_ATTR_MASK (ARM_LPAE_PTE_ATTR_LO_MASK | \
  86. ARM_LPAE_PTE_ATTR_HI_MASK)
  87. /* Software bit for solving coherency races */
  88. #define ARM_LPAE_PTE_SW_SYNC (((arm_lpae_iopte)1) << 55)
  89. /* Stage-1 PTE */
  90. #define ARM_LPAE_PTE_AP_UNPRIV (((arm_lpae_iopte)1) << 6)
  91. #define ARM_LPAE_PTE_AP_RDONLY (((arm_lpae_iopte)2) << 6)
  92. #define ARM_LPAE_PTE_ATTRINDX_SHIFT 2
  93. #define ARM_LPAE_PTE_nG (((arm_lpae_iopte)1) << 11)
  94. /* Stage-2 PTE */
  95. #define ARM_LPAE_PTE_HAP_FAULT (((arm_lpae_iopte)0) << 6)
  96. #define ARM_LPAE_PTE_HAP_READ (((arm_lpae_iopte)1) << 6)
  97. #define ARM_LPAE_PTE_HAP_WRITE (((arm_lpae_iopte)2) << 6)
  98. #define ARM_LPAE_PTE_MEMATTR_OIWB (((arm_lpae_iopte)0xf) << 2)
  99. #define ARM_LPAE_PTE_MEMATTR_NC (((arm_lpae_iopte)0x5) << 2)
  100. #define ARM_LPAE_PTE_MEMATTR_DEV (((arm_lpae_iopte)0x1) << 2)
  101. /* Register bits */
  102. #define ARM_32_LPAE_TCR_EAE (1 << 31)
  103. #define ARM_64_LPAE_S2_TCR_RES1 (1 << 31)
  104. #define ARM_LPAE_TCR_EPD1 (1 << 23)
  105. #define ARM_LPAE_TCR_TG0_4K (0 << 14)
  106. #define ARM_LPAE_TCR_TG0_64K (1 << 14)
  107. #define ARM_LPAE_TCR_TG0_16K (2 << 14)
  108. #define ARM_LPAE_TCR_SH0_SHIFT 12
  109. #define ARM_LPAE_TCR_SH0_MASK 0x3
  110. #define ARM_LPAE_TCR_SH_NS 0
  111. #define ARM_LPAE_TCR_SH_OS 2
  112. #define ARM_LPAE_TCR_SH_IS 3
  113. #define ARM_LPAE_TCR_ORGN0_SHIFT 10
  114. #define ARM_LPAE_TCR_IRGN0_SHIFT 8
  115. #define ARM_LPAE_TCR_RGN_MASK 0x3
  116. #define ARM_LPAE_TCR_RGN_NC 0
  117. #define ARM_LPAE_TCR_RGN_WBWA 1
  118. #define ARM_LPAE_TCR_RGN_WT 2
  119. #define ARM_LPAE_TCR_RGN_WB 3
  120. #define ARM_LPAE_TCR_SL0_SHIFT 6
  121. #define ARM_LPAE_TCR_SL0_MASK 0x3
  122. #define ARM_LPAE_TCR_T0SZ_SHIFT 0
  123. #define ARM_LPAE_TCR_SZ_MASK 0xf
  124. #define ARM_LPAE_TCR_PS_SHIFT 16
  125. #define ARM_LPAE_TCR_PS_MASK 0x7
  126. #define ARM_LPAE_TCR_IPS_SHIFT 32
  127. #define ARM_LPAE_TCR_IPS_MASK 0x7
  128. #define ARM_LPAE_TCR_PS_32_BIT 0x0ULL
  129. #define ARM_LPAE_TCR_PS_36_BIT 0x1ULL
  130. #define ARM_LPAE_TCR_PS_40_BIT 0x2ULL
  131. #define ARM_LPAE_TCR_PS_42_BIT 0x3ULL
  132. #define ARM_LPAE_TCR_PS_44_BIT 0x4ULL
  133. #define ARM_LPAE_TCR_PS_48_BIT 0x5ULL
  134. #define ARM_LPAE_TCR_PS_52_BIT 0x6ULL
  135. #define ARM_LPAE_MAIR_ATTR_SHIFT(n) ((n) << 3)
  136. #define ARM_LPAE_MAIR_ATTR_MASK 0xff
  137. #define ARM_LPAE_MAIR_ATTR_DEVICE 0x04
  138. #define ARM_LPAE_MAIR_ATTR_NC 0x44
  139. #define ARM_LPAE_MAIR_ATTR_WBRWA 0xff
  140. #define ARM_LPAE_MAIR_ATTR_IDX_NC 0
  141. #define ARM_LPAE_MAIR_ATTR_IDX_CACHE 1
  142. #define ARM_LPAE_MAIR_ATTR_IDX_DEV 2
  143. /* IOPTE accessors */
  144. #define iopte_deref(pte,d) __va(iopte_to_paddr(pte, d))
  145. #define iopte_type(pte,l) \
  146. (((pte) >> ARM_LPAE_PTE_TYPE_SHIFT) & ARM_LPAE_PTE_TYPE_MASK)
  147. #define iopte_prot(pte) ((pte) & ARM_LPAE_PTE_ATTR_MASK)
  148. #define iopte_leaf(pte,l) \
  149. (l == (ARM_LPAE_MAX_LEVELS - 1) ? \
  150. (iopte_type(pte,l) == ARM_LPAE_PTE_TYPE_PAGE) : \
  151. (iopte_type(pte,l) == ARM_LPAE_PTE_TYPE_BLOCK))
  152. struct arm_lpae_io_pgtable {
  153. struct io_pgtable iop;
  154. int levels;
  155. size_t pgd_size;
  156. unsigned long pg_shift;
  157. unsigned long bits_per_level;
  158. void *pgd;
  159. };
  160. typedef u64 arm_lpae_iopte;
  161. static arm_lpae_iopte paddr_to_iopte(phys_addr_t paddr,
  162. struct arm_lpae_io_pgtable *data)
  163. {
  164. arm_lpae_iopte pte = paddr;
  165. /* Of the bits which overlap, either 51:48 or 15:12 are always RES0 */
  166. return (pte | (pte >> (48 - 12))) & ARM_LPAE_PTE_ADDR_MASK;
  167. }
  168. static phys_addr_t iopte_to_paddr(arm_lpae_iopte pte,
  169. struct arm_lpae_io_pgtable *data)
  170. {
  171. u64 paddr = pte & ARM_LPAE_PTE_ADDR_MASK;
  172. if (data->pg_shift < 16)
  173. return paddr;
  174. /* Rotate the packed high-order bits back to the top */
  175. return (paddr | (paddr << (48 - 12))) & (ARM_LPAE_PTE_ADDR_MASK << 4);
  176. }
  177. static bool selftest_running = false;
  178. static dma_addr_t __arm_lpae_dma_addr(void *pages)
  179. {
  180. return (dma_addr_t)virt_to_phys(pages);
  181. }
  182. static void *__arm_lpae_alloc_pages(size_t size, gfp_t gfp,
  183. struct io_pgtable_cfg *cfg)
  184. {
  185. struct device *dev = cfg->iommu_dev;
  186. int order = get_order(size);
  187. struct page *p;
  188. dma_addr_t dma;
  189. void *pages;
  190. VM_BUG_ON((gfp & __GFP_HIGHMEM));
  191. p = alloc_pages_node(dev_to_node(dev), gfp | __GFP_ZERO, order);
  192. if (!p)
  193. return NULL;
  194. pages = page_address(p);
  195. if (!(cfg->quirks & IO_PGTABLE_QUIRK_NO_DMA)) {
  196. dma = dma_map_single(dev, pages, size, DMA_TO_DEVICE);
  197. if (dma_mapping_error(dev, dma))
  198. goto out_free;
  199. /*
  200. * We depend on the IOMMU being able to work with any physical
  201. * address directly, so if the DMA layer suggests otherwise by
  202. * translating or truncating them, that bodes very badly...
  203. */
  204. if (dma != virt_to_phys(pages))
  205. goto out_unmap;
  206. }
  207. return pages;
  208. out_unmap:
  209. dev_err(dev, "Cannot accommodate DMA translation for IOMMU page tables\n");
  210. dma_unmap_single(dev, dma, size, DMA_TO_DEVICE);
  211. out_free:
  212. __free_pages(p, order);
  213. return NULL;
  214. }
  215. static void __arm_lpae_free_pages(void *pages, size_t size,
  216. struct io_pgtable_cfg *cfg)
  217. {
  218. if (!(cfg->quirks & IO_PGTABLE_QUIRK_NO_DMA))
  219. dma_unmap_single(cfg->iommu_dev, __arm_lpae_dma_addr(pages),
  220. size, DMA_TO_DEVICE);
  221. free_pages((unsigned long)pages, get_order(size));
  222. }
  223. static void __arm_lpae_sync_pte(arm_lpae_iopte *ptep,
  224. struct io_pgtable_cfg *cfg)
  225. {
  226. dma_sync_single_for_device(cfg->iommu_dev, __arm_lpae_dma_addr(ptep),
  227. sizeof(*ptep), DMA_TO_DEVICE);
  228. }
  229. static void __arm_lpae_set_pte(arm_lpae_iopte *ptep, arm_lpae_iopte pte,
  230. struct io_pgtable_cfg *cfg)
  231. {
  232. *ptep = pte;
  233. if (!(cfg->quirks & IO_PGTABLE_QUIRK_NO_DMA))
  234. __arm_lpae_sync_pte(ptep, cfg);
  235. }
  236. static size_t __arm_lpae_unmap(struct arm_lpae_io_pgtable *data,
  237. unsigned long iova, size_t size, int lvl,
  238. arm_lpae_iopte *ptep);
  239. static void __arm_lpae_init_pte(struct arm_lpae_io_pgtable *data,
  240. phys_addr_t paddr, arm_lpae_iopte prot,
  241. int lvl, arm_lpae_iopte *ptep)
  242. {
  243. arm_lpae_iopte pte = prot;
  244. if (data->iop.cfg.quirks & IO_PGTABLE_QUIRK_ARM_NS)
  245. pte |= ARM_LPAE_PTE_NS;
  246. if (lvl == ARM_LPAE_MAX_LEVELS - 1)
  247. pte |= ARM_LPAE_PTE_TYPE_PAGE;
  248. else
  249. pte |= ARM_LPAE_PTE_TYPE_BLOCK;
  250. pte |= ARM_LPAE_PTE_AF | ARM_LPAE_PTE_SH_IS;
  251. pte |= paddr_to_iopte(paddr, data);
  252. __arm_lpae_set_pte(ptep, pte, &data->iop.cfg);
  253. }
  254. static int arm_lpae_init_pte(struct arm_lpae_io_pgtable *data,
  255. unsigned long iova, phys_addr_t paddr,
  256. arm_lpae_iopte prot, int lvl,
  257. arm_lpae_iopte *ptep)
  258. {
  259. arm_lpae_iopte pte = *ptep;
  260. if (iopte_leaf(pte, lvl)) {
  261. /* We require an unmap first */
  262. WARN_ON(!selftest_running);
  263. return -EEXIST;
  264. } else if (iopte_type(pte, lvl) == ARM_LPAE_PTE_TYPE_TABLE) {
  265. /*
  266. * We need to unmap and free the old table before
  267. * overwriting it with a block entry.
  268. */
  269. arm_lpae_iopte *tblp;
  270. size_t sz = ARM_LPAE_BLOCK_SIZE(lvl, data);
  271. tblp = ptep - ARM_LPAE_LVL_IDX(iova, lvl, data);
  272. if (WARN_ON(__arm_lpae_unmap(data, iova, sz, lvl, tblp) != sz))
  273. return -EINVAL;
  274. }
  275. __arm_lpae_init_pte(data, paddr, prot, lvl, ptep);
  276. return 0;
  277. }
  278. static arm_lpae_iopte arm_lpae_install_table(arm_lpae_iopte *table,
  279. arm_lpae_iopte *ptep,
  280. arm_lpae_iopte curr,
  281. struct io_pgtable_cfg *cfg)
  282. {
  283. arm_lpae_iopte old, new;
  284. new = __pa(table) | ARM_LPAE_PTE_TYPE_TABLE;
  285. if (cfg->quirks & IO_PGTABLE_QUIRK_ARM_NS)
  286. new |= ARM_LPAE_PTE_NSTABLE;
  287. /*
  288. * Ensure the table itself is visible before its PTE can be.
  289. * Whilst we could get away with cmpxchg64_release below, this
  290. * doesn't have any ordering semantics when !CONFIG_SMP.
  291. */
  292. dma_wmb();
  293. old = cmpxchg64_relaxed(ptep, curr, new);
  294. if ((cfg->quirks & IO_PGTABLE_QUIRK_NO_DMA) ||
  295. (old & ARM_LPAE_PTE_SW_SYNC))
  296. return old;
  297. /* Even if it's not ours, there's no point waiting; just kick it */
  298. __arm_lpae_sync_pte(ptep, cfg);
  299. if (old == curr)
  300. WRITE_ONCE(*ptep, new | ARM_LPAE_PTE_SW_SYNC);
  301. return old;
  302. }
  303. static int __arm_lpae_map(struct arm_lpae_io_pgtable *data, unsigned long iova,
  304. phys_addr_t paddr, size_t size, arm_lpae_iopte prot,
  305. int lvl, arm_lpae_iopte *ptep)
  306. {
  307. arm_lpae_iopte *cptep, pte;
  308. size_t block_size = ARM_LPAE_BLOCK_SIZE(lvl, data);
  309. size_t tblsz = ARM_LPAE_GRANULE(data);
  310. struct io_pgtable_cfg *cfg = &data->iop.cfg;
  311. /* Find our entry at the current level */
  312. ptep += ARM_LPAE_LVL_IDX(iova, lvl, data);
  313. /* If we can install a leaf entry at this level, then do so */
  314. if (size == block_size && (size & cfg->pgsize_bitmap))
  315. return arm_lpae_init_pte(data, iova, paddr, prot, lvl, ptep);
  316. /* We can't allocate tables at the final level */
  317. if (WARN_ON(lvl >= ARM_LPAE_MAX_LEVELS - 1))
  318. return -EINVAL;
  319. /* Grab a pointer to the next level */
  320. pte = READ_ONCE(*ptep);
  321. if (!pte) {
  322. cptep = __arm_lpae_alloc_pages(tblsz, GFP_ATOMIC, cfg);
  323. if (!cptep)
  324. return -ENOMEM;
  325. pte = arm_lpae_install_table(cptep, ptep, 0, cfg);
  326. if (pte)
  327. __arm_lpae_free_pages(cptep, tblsz, cfg);
  328. } else if (!(cfg->quirks & IO_PGTABLE_QUIRK_NO_DMA) &&
  329. !(pte & ARM_LPAE_PTE_SW_SYNC)) {
  330. __arm_lpae_sync_pte(ptep, cfg);
  331. }
  332. if (pte && !iopte_leaf(pte, lvl)) {
  333. cptep = iopte_deref(pte, data);
  334. } else if (pte) {
  335. /* We require an unmap first */
  336. WARN_ON(!selftest_running);
  337. return -EEXIST;
  338. }
  339. /* Rinse, repeat */
  340. return __arm_lpae_map(data, iova, paddr, size, prot, lvl + 1, cptep);
  341. }
  342. static arm_lpae_iopte arm_lpae_prot_to_pte(struct arm_lpae_io_pgtable *data,
  343. int prot)
  344. {
  345. arm_lpae_iopte pte;
  346. if (data->iop.fmt == ARM_64_LPAE_S1 ||
  347. data->iop.fmt == ARM_32_LPAE_S1) {
  348. pte = ARM_LPAE_PTE_nG;
  349. if (!(prot & IOMMU_WRITE) && (prot & IOMMU_READ))
  350. pte |= ARM_LPAE_PTE_AP_RDONLY;
  351. if (!(prot & IOMMU_PRIV))
  352. pte |= ARM_LPAE_PTE_AP_UNPRIV;
  353. if (prot & IOMMU_MMIO)
  354. pte |= (ARM_LPAE_MAIR_ATTR_IDX_DEV
  355. << ARM_LPAE_PTE_ATTRINDX_SHIFT);
  356. else if (prot & IOMMU_CACHE)
  357. pte |= (ARM_LPAE_MAIR_ATTR_IDX_CACHE
  358. << ARM_LPAE_PTE_ATTRINDX_SHIFT);
  359. } else {
  360. pte = ARM_LPAE_PTE_HAP_FAULT;
  361. if (prot & IOMMU_READ)
  362. pte |= ARM_LPAE_PTE_HAP_READ;
  363. if (prot & IOMMU_WRITE)
  364. pte |= ARM_LPAE_PTE_HAP_WRITE;
  365. if (prot & IOMMU_MMIO)
  366. pte |= ARM_LPAE_PTE_MEMATTR_DEV;
  367. else if (prot & IOMMU_CACHE)
  368. pte |= ARM_LPAE_PTE_MEMATTR_OIWB;
  369. else
  370. pte |= ARM_LPAE_PTE_MEMATTR_NC;
  371. }
  372. if (prot & IOMMU_NOEXEC)
  373. pte |= ARM_LPAE_PTE_XN;
  374. return pte;
  375. }
  376. static int arm_lpae_map(struct io_pgtable_ops *ops, unsigned long iova,
  377. phys_addr_t paddr, size_t size, int iommu_prot)
  378. {
  379. struct arm_lpae_io_pgtable *data = io_pgtable_ops_to_data(ops);
  380. arm_lpae_iopte *ptep = data->pgd;
  381. int ret, lvl = ARM_LPAE_START_LVL(data);
  382. arm_lpae_iopte prot;
  383. /* If no access, then nothing to do */
  384. if (!(iommu_prot & (IOMMU_READ | IOMMU_WRITE)))
  385. return 0;
  386. if (WARN_ON(iova >= (1ULL << data->iop.cfg.ias) ||
  387. paddr >= (1ULL << data->iop.cfg.oas)))
  388. return -ERANGE;
  389. prot = arm_lpae_prot_to_pte(data, iommu_prot);
  390. ret = __arm_lpae_map(data, iova, paddr, size, prot, lvl, ptep);
  391. /*
  392. * Synchronise all PTE updates for the new mapping before there's
  393. * a chance for anything to kick off a table walk for the new iova.
  394. */
  395. wmb();
  396. return ret;
  397. }
  398. static void __arm_lpae_free_pgtable(struct arm_lpae_io_pgtable *data, int lvl,
  399. arm_lpae_iopte *ptep)
  400. {
  401. arm_lpae_iopte *start, *end;
  402. unsigned long table_size;
  403. if (lvl == ARM_LPAE_START_LVL(data))
  404. table_size = data->pgd_size;
  405. else
  406. table_size = ARM_LPAE_GRANULE(data);
  407. start = ptep;
  408. /* Only leaf entries at the last level */
  409. if (lvl == ARM_LPAE_MAX_LEVELS - 1)
  410. end = ptep;
  411. else
  412. end = (void *)ptep + table_size;
  413. while (ptep != end) {
  414. arm_lpae_iopte pte = *ptep++;
  415. if (!pte || iopte_leaf(pte, lvl))
  416. continue;
  417. __arm_lpae_free_pgtable(data, lvl + 1, iopte_deref(pte, data));
  418. }
  419. __arm_lpae_free_pages(start, table_size, &data->iop.cfg);
  420. }
  421. static void arm_lpae_free_pgtable(struct io_pgtable *iop)
  422. {
  423. struct arm_lpae_io_pgtable *data = io_pgtable_to_data(iop);
  424. __arm_lpae_free_pgtable(data, ARM_LPAE_START_LVL(data), data->pgd);
  425. kfree(data);
  426. }
  427. static size_t arm_lpae_split_blk_unmap(struct arm_lpae_io_pgtable *data,
  428. unsigned long iova, size_t size,
  429. arm_lpae_iopte blk_pte, int lvl,
  430. arm_lpae_iopte *ptep)
  431. {
  432. struct io_pgtable_cfg *cfg = &data->iop.cfg;
  433. arm_lpae_iopte pte, *tablep;
  434. phys_addr_t blk_paddr;
  435. size_t tablesz = ARM_LPAE_GRANULE(data);
  436. size_t split_sz = ARM_LPAE_BLOCK_SIZE(lvl, data);
  437. int i, unmap_idx = -1;
  438. if (WARN_ON(lvl == ARM_LPAE_MAX_LEVELS))
  439. return 0;
  440. tablep = __arm_lpae_alloc_pages(tablesz, GFP_ATOMIC, cfg);
  441. if (!tablep)
  442. return 0; /* Bytes unmapped */
  443. if (size == split_sz)
  444. unmap_idx = ARM_LPAE_LVL_IDX(iova, lvl, data);
  445. blk_paddr = iopte_to_paddr(blk_pte, data);
  446. pte = iopte_prot(blk_pte);
  447. for (i = 0; i < tablesz / sizeof(pte); i++, blk_paddr += split_sz) {
  448. /* Unmap! */
  449. if (i == unmap_idx)
  450. continue;
  451. __arm_lpae_init_pte(data, blk_paddr, pte, lvl, &tablep[i]);
  452. }
  453. pte = arm_lpae_install_table(tablep, ptep, blk_pte, cfg);
  454. if (pte != blk_pte) {
  455. __arm_lpae_free_pages(tablep, tablesz, cfg);
  456. /*
  457. * We may race against someone unmapping another part of this
  458. * block, but anything else is invalid. We can't misinterpret
  459. * a page entry here since we're never at the last level.
  460. */
  461. if (iopte_type(pte, lvl - 1) != ARM_LPAE_PTE_TYPE_TABLE)
  462. return 0;
  463. tablep = iopte_deref(pte, data);
  464. }
  465. if (unmap_idx < 0)
  466. return __arm_lpae_unmap(data, iova, size, lvl, tablep);
  467. io_pgtable_tlb_add_flush(&data->iop, iova, size, size, true);
  468. return size;
  469. }
  470. static size_t __arm_lpae_unmap(struct arm_lpae_io_pgtable *data,
  471. unsigned long iova, size_t size, int lvl,
  472. arm_lpae_iopte *ptep)
  473. {
  474. arm_lpae_iopte pte;
  475. struct io_pgtable *iop = &data->iop;
  476. /* Something went horribly wrong and we ran out of page table */
  477. if (WARN_ON(lvl == ARM_LPAE_MAX_LEVELS))
  478. return 0;
  479. ptep += ARM_LPAE_LVL_IDX(iova, lvl, data);
  480. pte = READ_ONCE(*ptep);
  481. if (WARN_ON(!pte))
  482. return 0;
  483. /* If the size matches this level, we're in the right place */
  484. if (size == ARM_LPAE_BLOCK_SIZE(lvl, data)) {
  485. __arm_lpae_set_pte(ptep, 0, &iop->cfg);
  486. if (!iopte_leaf(pte, lvl)) {
  487. /* Also flush any partial walks */
  488. io_pgtable_tlb_add_flush(iop, iova, size,
  489. ARM_LPAE_GRANULE(data), false);
  490. io_pgtable_tlb_sync(iop);
  491. ptep = iopte_deref(pte, data);
  492. __arm_lpae_free_pgtable(data, lvl + 1, ptep);
  493. } else {
  494. io_pgtable_tlb_add_flush(iop, iova, size, size, true);
  495. }
  496. return size;
  497. } else if (iopte_leaf(pte, lvl)) {
  498. /*
  499. * Insert a table at the next level to map the old region,
  500. * minus the part we want to unmap
  501. */
  502. return arm_lpae_split_blk_unmap(data, iova, size, pte,
  503. lvl + 1, ptep);
  504. }
  505. /* Keep on walkin' */
  506. ptep = iopte_deref(pte, data);
  507. return __arm_lpae_unmap(data, iova, size, lvl + 1, ptep);
  508. }
  509. static size_t arm_lpae_unmap(struct io_pgtable_ops *ops, unsigned long iova,
  510. size_t size)
  511. {
  512. struct arm_lpae_io_pgtable *data = io_pgtable_ops_to_data(ops);
  513. arm_lpae_iopte *ptep = data->pgd;
  514. int lvl = ARM_LPAE_START_LVL(data);
  515. if (WARN_ON(iova >= (1ULL << data->iop.cfg.ias)))
  516. return 0;
  517. return __arm_lpae_unmap(data, iova, size, lvl, ptep);
  518. }
  519. static phys_addr_t arm_lpae_iova_to_phys(struct io_pgtable_ops *ops,
  520. unsigned long iova)
  521. {
  522. struct arm_lpae_io_pgtable *data = io_pgtable_ops_to_data(ops);
  523. arm_lpae_iopte pte, *ptep = data->pgd;
  524. int lvl = ARM_LPAE_START_LVL(data);
  525. do {
  526. /* Valid IOPTE pointer? */
  527. if (!ptep)
  528. return 0;
  529. /* Grab the IOPTE we're interested in */
  530. ptep += ARM_LPAE_LVL_IDX(iova, lvl, data);
  531. pte = READ_ONCE(*ptep);
  532. /* Valid entry? */
  533. if (!pte)
  534. return 0;
  535. /* Leaf entry? */
  536. if (iopte_leaf(pte,lvl))
  537. goto found_translation;
  538. /* Take it to the next level */
  539. ptep = iopte_deref(pte, data);
  540. } while (++lvl < ARM_LPAE_MAX_LEVELS);
  541. /* Ran out of page tables to walk */
  542. return 0;
  543. found_translation:
  544. iova &= (ARM_LPAE_BLOCK_SIZE(lvl, data) - 1);
  545. return iopte_to_paddr(pte, data) | iova;
  546. }
  547. static void arm_lpae_restrict_pgsizes(struct io_pgtable_cfg *cfg)
  548. {
  549. unsigned long granule, page_sizes;
  550. unsigned int max_addr_bits = 48;
  551. /*
  552. * We need to restrict the supported page sizes to match the
  553. * translation regime for a particular granule. Aim to match
  554. * the CPU page size if possible, otherwise prefer smaller sizes.
  555. * While we're at it, restrict the block sizes to match the
  556. * chosen granule.
  557. */
  558. if (cfg->pgsize_bitmap & PAGE_SIZE)
  559. granule = PAGE_SIZE;
  560. else if (cfg->pgsize_bitmap & ~PAGE_MASK)
  561. granule = 1UL << __fls(cfg->pgsize_bitmap & ~PAGE_MASK);
  562. else if (cfg->pgsize_bitmap & PAGE_MASK)
  563. granule = 1UL << __ffs(cfg->pgsize_bitmap & PAGE_MASK);
  564. else
  565. granule = 0;
  566. switch (granule) {
  567. case SZ_4K:
  568. page_sizes = (SZ_4K | SZ_2M | SZ_1G);
  569. break;
  570. case SZ_16K:
  571. page_sizes = (SZ_16K | SZ_32M);
  572. break;
  573. case SZ_64K:
  574. max_addr_bits = 52;
  575. page_sizes = (SZ_64K | SZ_512M);
  576. if (cfg->oas > 48)
  577. page_sizes |= 1ULL << 42; /* 4TB */
  578. break;
  579. default:
  580. page_sizes = 0;
  581. }
  582. cfg->pgsize_bitmap &= page_sizes;
  583. cfg->ias = min(cfg->ias, max_addr_bits);
  584. cfg->oas = min(cfg->oas, max_addr_bits);
  585. }
  586. static struct arm_lpae_io_pgtable *
  587. arm_lpae_alloc_pgtable(struct io_pgtable_cfg *cfg)
  588. {
  589. unsigned long va_bits, pgd_bits;
  590. struct arm_lpae_io_pgtable *data;
  591. arm_lpae_restrict_pgsizes(cfg);
  592. if (!(cfg->pgsize_bitmap & (SZ_4K | SZ_16K | SZ_64K)))
  593. return NULL;
  594. if (cfg->ias > ARM_LPAE_MAX_ADDR_BITS)
  595. return NULL;
  596. if (cfg->oas > ARM_LPAE_MAX_ADDR_BITS)
  597. return NULL;
  598. if (!selftest_running && cfg->iommu_dev->dma_pfn_offset) {
  599. dev_err(cfg->iommu_dev, "Cannot accommodate DMA offset for IOMMU page tables\n");
  600. return NULL;
  601. }
  602. data = kmalloc(sizeof(*data), GFP_KERNEL);
  603. if (!data)
  604. return NULL;
  605. data->pg_shift = __ffs(cfg->pgsize_bitmap);
  606. data->bits_per_level = data->pg_shift - ilog2(sizeof(arm_lpae_iopte));
  607. va_bits = cfg->ias - data->pg_shift;
  608. data->levels = DIV_ROUND_UP(va_bits, data->bits_per_level);
  609. /* Calculate the actual size of our pgd (without concatenation) */
  610. pgd_bits = va_bits - (data->bits_per_level * (data->levels - 1));
  611. data->pgd_size = 1UL << (pgd_bits + ilog2(sizeof(arm_lpae_iopte)));
  612. data->iop.ops = (struct io_pgtable_ops) {
  613. .map = arm_lpae_map,
  614. .unmap = arm_lpae_unmap,
  615. .iova_to_phys = arm_lpae_iova_to_phys,
  616. };
  617. return data;
  618. }
  619. static struct io_pgtable *
  620. arm_64_lpae_alloc_pgtable_s1(struct io_pgtable_cfg *cfg, void *cookie)
  621. {
  622. u64 reg;
  623. struct arm_lpae_io_pgtable *data;
  624. if (cfg->quirks & ~(IO_PGTABLE_QUIRK_ARM_NS | IO_PGTABLE_QUIRK_NO_DMA))
  625. return NULL;
  626. data = arm_lpae_alloc_pgtable(cfg);
  627. if (!data)
  628. return NULL;
  629. /* TCR */
  630. reg = (ARM_LPAE_TCR_SH_IS << ARM_LPAE_TCR_SH0_SHIFT) |
  631. (ARM_LPAE_TCR_RGN_WBWA << ARM_LPAE_TCR_IRGN0_SHIFT) |
  632. (ARM_LPAE_TCR_RGN_WBWA << ARM_LPAE_TCR_ORGN0_SHIFT);
  633. switch (ARM_LPAE_GRANULE(data)) {
  634. case SZ_4K:
  635. reg |= ARM_LPAE_TCR_TG0_4K;
  636. break;
  637. case SZ_16K:
  638. reg |= ARM_LPAE_TCR_TG0_16K;
  639. break;
  640. case SZ_64K:
  641. reg |= ARM_LPAE_TCR_TG0_64K;
  642. break;
  643. }
  644. switch (cfg->oas) {
  645. case 32:
  646. reg |= (ARM_LPAE_TCR_PS_32_BIT << ARM_LPAE_TCR_IPS_SHIFT);
  647. break;
  648. case 36:
  649. reg |= (ARM_LPAE_TCR_PS_36_BIT << ARM_LPAE_TCR_IPS_SHIFT);
  650. break;
  651. case 40:
  652. reg |= (ARM_LPAE_TCR_PS_40_BIT << ARM_LPAE_TCR_IPS_SHIFT);
  653. break;
  654. case 42:
  655. reg |= (ARM_LPAE_TCR_PS_42_BIT << ARM_LPAE_TCR_IPS_SHIFT);
  656. break;
  657. case 44:
  658. reg |= (ARM_LPAE_TCR_PS_44_BIT << ARM_LPAE_TCR_IPS_SHIFT);
  659. break;
  660. case 48:
  661. reg |= (ARM_LPAE_TCR_PS_48_BIT << ARM_LPAE_TCR_IPS_SHIFT);
  662. break;
  663. case 52:
  664. reg |= (ARM_LPAE_TCR_PS_52_BIT << ARM_LPAE_TCR_IPS_SHIFT);
  665. break;
  666. default:
  667. goto out_free_data;
  668. }
  669. reg |= (64ULL - cfg->ias) << ARM_LPAE_TCR_T0SZ_SHIFT;
  670. /* Disable speculative walks through TTBR1 */
  671. reg |= ARM_LPAE_TCR_EPD1;
  672. cfg->arm_lpae_s1_cfg.tcr = reg;
  673. /* MAIRs */
  674. reg = (ARM_LPAE_MAIR_ATTR_NC
  675. << ARM_LPAE_MAIR_ATTR_SHIFT(ARM_LPAE_MAIR_ATTR_IDX_NC)) |
  676. (ARM_LPAE_MAIR_ATTR_WBRWA
  677. << ARM_LPAE_MAIR_ATTR_SHIFT(ARM_LPAE_MAIR_ATTR_IDX_CACHE)) |
  678. (ARM_LPAE_MAIR_ATTR_DEVICE
  679. << ARM_LPAE_MAIR_ATTR_SHIFT(ARM_LPAE_MAIR_ATTR_IDX_DEV));
  680. cfg->arm_lpae_s1_cfg.mair[0] = reg;
  681. cfg->arm_lpae_s1_cfg.mair[1] = 0;
  682. /* Looking good; allocate a pgd */
  683. data->pgd = __arm_lpae_alloc_pages(data->pgd_size, GFP_KERNEL, cfg);
  684. if (!data->pgd)
  685. goto out_free_data;
  686. /* Ensure the empty pgd is visible before any actual TTBR write */
  687. wmb();
  688. /* TTBRs */
  689. cfg->arm_lpae_s1_cfg.ttbr[0] = virt_to_phys(data->pgd);
  690. cfg->arm_lpae_s1_cfg.ttbr[1] = 0;
  691. return &data->iop;
  692. out_free_data:
  693. kfree(data);
  694. return NULL;
  695. }
  696. static struct io_pgtable *
  697. arm_64_lpae_alloc_pgtable_s2(struct io_pgtable_cfg *cfg, void *cookie)
  698. {
  699. u64 reg, sl;
  700. struct arm_lpae_io_pgtable *data;
  701. /* The NS quirk doesn't apply at stage 2 */
  702. if (cfg->quirks & ~IO_PGTABLE_QUIRK_NO_DMA)
  703. return NULL;
  704. data = arm_lpae_alloc_pgtable(cfg);
  705. if (!data)
  706. return NULL;
  707. /*
  708. * Concatenate PGDs at level 1 if possible in order to reduce
  709. * the depth of the stage-2 walk.
  710. */
  711. if (data->levels == ARM_LPAE_MAX_LEVELS) {
  712. unsigned long pgd_pages;
  713. pgd_pages = data->pgd_size >> ilog2(sizeof(arm_lpae_iopte));
  714. if (pgd_pages <= ARM_LPAE_S2_MAX_CONCAT_PAGES) {
  715. data->pgd_size = pgd_pages << data->pg_shift;
  716. data->levels--;
  717. }
  718. }
  719. /* VTCR */
  720. reg = ARM_64_LPAE_S2_TCR_RES1 |
  721. (ARM_LPAE_TCR_SH_IS << ARM_LPAE_TCR_SH0_SHIFT) |
  722. (ARM_LPAE_TCR_RGN_WBWA << ARM_LPAE_TCR_IRGN0_SHIFT) |
  723. (ARM_LPAE_TCR_RGN_WBWA << ARM_LPAE_TCR_ORGN0_SHIFT);
  724. sl = ARM_LPAE_START_LVL(data);
  725. switch (ARM_LPAE_GRANULE(data)) {
  726. case SZ_4K:
  727. reg |= ARM_LPAE_TCR_TG0_4K;
  728. sl++; /* SL0 format is different for 4K granule size */
  729. break;
  730. case SZ_16K:
  731. reg |= ARM_LPAE_TCR_TG0_16K;
  732. break;
  733. case SZ_64K:
  734. reg |= ARM_LPAE_TCR_TG0_64K;
  735. break;
  736. }
  737. switch (cfg->oas) {
  738. case 32:
  739. reg |= (ARM_LPAE_TCR_PS_32_BIT << ARM_LPAE_TCR_PS_SHIFT);
  740. break;
  741. case 36:
  742. reg |= (ARM_LPAE_TCR_PS_36_BIT << ARM_LPAE_TCR_PS_SHIFT);
  743. break;
  744. case 40:
  745. reg |= (ARM_LPAE_TCR_PS_40_BIT << ARM_LPAE_TCR_PS_SHIFT);
  746. break;
  747. case 42:
  748. reg |= (ARM_LPAE_TCR_PS_42_BIT << ARM_LPAE_TCR_PS_SHIFT);
  749. break;
  750. case 44:
  751. reg |= (ARM_LPAE_TCR_PS_44_BIT << ARM_LPAE_TCR_PS_SHIFT);
  752. break;
  753. case 48:
  754. reg |= (ARM_LPAE_TCR_PS_48_BIT << ARM_LPAE_TCR_PS_SHIFT);
  755. break;
  756. case 52:
  757. reg |= (ARM_LPAE_TCR_PS_52_BIT << ARM_LPAE_TCR_PS_SHIFT);
  758. break;
  759. default:
  760. goto out_free_data;
  761. }
  762. reg |= (64ULL - cfg->ias) << ARM_LPAE_TCR_T0SZ_SHIFT;
  763. reg |= (~sl & ARM_LPAE_TCR_SL0_MASK) << ARM_LPAE_TCR_SL0_SHIFT;
  764. cfg->arm_lpae_s2_cfg.vtcr = reg;
  765. /* Allocate pgd pages */
  766. data->pgd = __arm_lpae_alloc_pages(data->pgd_size, GFP_KERNEL, cfg);
  767. if (!data->pgd)
  768. goto out_free_data;
  769. /* Ensure the empty pgd is visible before any actual TTBR write */
  770. wmb();
  771. /* VTTBR */
  772. cfg->arm_lpae_s2_cfg.vttbr = virt_to_phys(data->pgd);
  773. return &data->iop;
  774. out_free_data:
  775. kfree(data);
  776. return NULL;
  777. }
  778. static struct io_pgtable *
  779. arm_32_lpae_alloc_pgtable_s1(struct io_pgtable_cfg *cfg, void *cookie)
  780. {
  781. struct io_pgtable *iop;
  782. if (cfg->ias > 32 || cfg->oas > 40)
  783. return NULL;
  784. cfg->pgsize_bitmap &= (SZ_4K | SZ_2M | SZ_1G);
  785. iop = arm_64_lpae_alloc_pgtable_s1(cfg, cookie);
  786. if (iop) {
  787. cfg->arm_lpae_s1_cfg.tcr |= ARM_32_LPAE_TCR_EAE;
  788. cfg->arm_lpae_s1_cfg.tcr &= 0xffffffff;
  789. }
  790. return iop;
  791. }
  792. static struct io_pgtable *
  793. arm_32_lpae_alloc_pgtable_s2(struct io_pgtable_cfg *cfg, void *cookie)
  794. {
  795. struct io_pgtable *iop;
  796. if (cfg->ias > 40 || cfg->oas > 40)
  797. return NULL;
  798. cfg->pgsize_bitmap &= (SZ_4K | SZ_2M | SZ_1G);
  799. iop = arm_64_lpae_alloc_pgtable_s2(cfg, cookie);
  800. if (iop)
  801. cfg->arm_lpae_s2_cfg.vtcr &= 0xffffffff;
  802. return iop;
  803. }
  804. struct io_pgtable_init_fns io_pgtable_arm_64_lpae_s1_init_fns = {
  805. .alloc = arm_64_lpae_alloc_pgtable_s1,
  806. .free = arm_lpae_free_pgtable,
  807. };
  808. struct io_pgtable_init_fns io_pgtable_arm_64_lpae_s2_init_fns = {
  809. .alloc = arm_64_lpae_alloc_pgtable_s2,
  810. .free = arm_lpae_free_pgtable,
  811. };
  812. struct io_pgtable_init_fns io_pgtable_arm_32_lpae_s1_init_fns = {
  813. .alloc = arm_32_lpae_alloc_pgtable_s1,
  814. .free = arm_lpae_free_pgtable,
  815. };
  816. struct io_pgtable_init_fns io_pgtable_arm_32_lpae_s2_init_fns = {
  817. .alloc = arm_32_lpae_alloc_pgtable_s2,
  818. .free = arm_lpae_free_pgtable,
  819. };
  820. #ifdef CONFIG_IOMMU_IO_PGTABLE_LPAE_SELFTEST
  821. static struct io_pgtable_cfg *cfg_cookie;
  822. static void dummy_tlb_flush_all(void *cookie)
  823. {
  824. WARN_ON(cookie != cfg_cookie);
  825. }
  826. static void dummy_tlb_add_flush(unsigned long iova, size_t size,
  827. size_t granule, bool leaf, void *cookie)
  828. {
  829. WARN_ON(cookie != cfg_cookie);
  830. WARN_ON(!(size & cfg_cookie->pgsize_bitmap));
  831. }
  832. static void dummy_tlb_sync(void *cookie)
  833. {
  834. WARN_ON(cookie != cfg_cookie);
  835. }
  836. static const struct iommu_gather_ops dummy_tlb_ops __initconst = {
  837. .tlb_flush_all = dummy_tlb_flush_all,
  838. .tlb_add_flush = dummy_tlb_add_flush,
  839. .tlb_sync = dummy_tlb_sync,
  840. };
  841. static void __init arm_lpae_dump_ops(struct io_pgtable_ops *ops)
  842. {
  843. struct arm_lpae_io_pgtable *data = io_pgtable_ops_to_data(ops);
  844. struct io_pgtable_cfg *cfg = &data->iop.cfg;
  845. pr_err("cfg: pgsize_bitmap 0x%lx, ias %u-bit\n",
  846. cfg->pgsize_bitmap, cfg->ias);
  847. pr_err("data: %d levels, 0x%zx pgd_size, %lu pg_shift, %lu bits_per_level, pgd @ %p\n",
  848. data->levels, data->pgd_size, data->pg_shift,
  849. data->bits_per_level, data->pgd);
  850. }
  851. #define __FAIL(ops, i) ({ \
  852. WARN(1, "selftest: test failed for fmt idx %d\n", (i)); \
  853. arm_lpae_dump_ops(ops); \
  854. selftest_running = false; \
  855. -EFAULT; \
  856. })
  857. static int __init arm_lpae_run_tests(struct io_pgtable_cfg *cfg)
  858. {
  859. static const enum io_pgtable_fmt fmts[] = {
  860. ARM_64_LPAE_S1,
  861. ARM_64_LPAE_S2,
  862. };
  863. int i, j;
  864. unsigned long iova;
  865. size_t size;
  866. struct io_pgtable_ops *ops;
  867. selftest_running = true;
  868. for (i = 0; i < ARRAY_SIZE(fmts); ++i) {
  869. cfg_cookie = cfg;
  870. ops = alloc_io_pgtable_ops(fmts[i], cfg, cfg);
  871. if (!ops) {
  872. pr_err("selftest: failed to allocate io pgtable ops\n");
  873. return -ENOMEM;
  874. }
  875. /*
  876. * Initial sanity checks.
  877. * Empty page tables shouldn't provide any translations.
  878. */
  879. if (ops->iova_to_phys(ops, 42))
  880. return __FAIL(ops, i);
  881. if (ops->iova_to_phys(ops, SZ_1G + 42))
  882. return __FAIL(ops, i);
  883. if (ops->iova_to_phys(ops, SZ_2G + 42))
  884. return __FAIL(ops, i);
  885. /*
  886. * Distinct mappings of different granule sizes.
  887. */
  888. iova = 0;
  889. for_each_set_bit(j, &cfg->pgsize_bitmap, BITS_PER_LONG) {
  890. size = 1UL << j;
  891. if (ops->map(ops, iova, iova, size, IOMMU_READ |
  892. IOMMU_WRITE |
  893. IOMMU_NOEXEC |
  894. IOMMU_CACHE))
  895. return __FAIL(ops, i);
  896. /* Overlapping mappings */
  897. if (!ops->map(ops, iova, iova + size, size,
  898. IOMMU_READ | IOMMU_NOEXEC))
  899. return __FAIL(ops, i);
  900. if (ops->iova_to_phys(ops, iova + 42) != (iova + 42))
  901. return __FAIL(ops, i);
  902. iova += SZ_1G;
  903. }
  904. /* Partial unmap */
  905. size = 1UL << __ffs(cfg->pgsize_bitmap);
  906. if (ops->unmap(ops, SZ_1G + size, size) != size)
  907. return __FAIL(ops, i);
  908. /* Remap of partial unmap */
  909. if (ops->map(ops, SZ_1G + size, size, size, IOMMU_READ))
  910. return __FAIL(ops, i);
  911. if (ops->iova_to_phys(ops, SZ_1G + size + 42) != (size + 42))
  912. return __FAIL(ops, i);
  913. /* Full unmap */
  914. iova = 0;
  915. for_each_set_bit(j, &cfg->pgsize_bitmap, BITS_PER_LONG) {
  916. size = 1UL << j;
  917. if (ops->unmap(ops, iova, size) != size)
  918. return __FAIL(ops, i);
  919. if (ops->iova_to_phys(ops, iova + 42))
  920. return __FAIL(ops, i);
  921. /* Remap full block */
  922. if (ops->map(ops, iova, iova, size, IOMMU_WRITE))
  923. return __FAIL(ops, i);
  924. if (ops->iova_to_phys(ops, iova + 42) != (iova + 42))
  925. return __FAIL(ops, i);
  926. iova += SZ_1G;
  927. }
  928. free_io_pgtable_ops(ops);
  929. }
  930. selftest_running = false;
  931. return 0;
  932. }
  933. static int __init arm_lpae_do_selftests(void)
  934. {
  935. static const unsigned long pgsize[] = {
  936. SZ_4K | SZ_2M | SZ_1G,
  937. SZ_16K | SZ_32M,
  938. SZ_64K | SZ_512M,
  939. };
  940. static const unsigned int ias[] = {
  941. 32, 36, 40, 42, 44, 48,
  942. };
  943. int i, j, pass = 0, fail = 0;
  944. struct io_pgtable_cfg cfg = {
  945. .tlb = &dummy_tlb_ops,
  946. .oas = 48,
  947. .quirks = IO_PGTABLE_QUIRK_NO_DMA,
  948. };
  949. for (i = 0; i < ARRAY_SIZE(pgsize); ++i) {
  950. for (j = 0; j < ARRAY_SIZE(ias); ++j) {
  951. cfg.pgsize_bitmap = pgsize[i];
  952. cfg.ias = ias[j];
  953. pr_info("selftest: pgsize_bitmap 0x%08lx, IAS %u\n",
  954. pgsize[i], ias[j]);
  955. if (arm_lpae_run_tests(&cfg))
  956. fail++;
  957. else
  958. pass++;
  959. }
  960. }
  961. pr_info("selftest: completed with %d PASS %d FAIL\n", pass, fail);
  962. return fail ? -EFAULT : 0;
  963. }
  964. subsys_initcall(arm_lpae_do_selftests);
  965. #endif