adreno_gpu.c 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742
  1. /*
  2. * Copyright (C) 2013 Red Hat
  3. * Author: Rob Clark <robdclark@gmail.com>
  4. *
  5. * Copyright (c) 2014 The Linux Foundation. All rights reserved.
  6. *
  7. * This program is free software; you can redistribute it and/or modify it
  8. * under the terms of the GNU General Public License version 2 as published by
  9. * the Free Software Foundation.
  10. *
  11. * This program is distributed in the hope that it will be useful, but WITHOUT
  12. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  14. * more details.
  15. *
  16. * You should have received a copy of the GNU General Public License along with
  17. * this program. If not, see <http://www.gnu.org/licenses/>.
  18. */
  19. #include <linux/ascii85.h>
  20. #include <linux/kernel.h>
  21. #include <linux/pm_opp.h>
  22. #include <linux/slab.h>
  23. #include "adreno_gpu.h"
  24. #include "msm_gem.h"
  25. #include "msm_mmu.h"
  26. int adreno_get_param(struct msm_gpu *gpu, uint32_t param, uint64_t *value)
  27. {
  28. struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
  29. switch (param) {
  30. case MSM_PARAM_GPU_ID:
  31. *value = adreno_gpu->info->revn;
  32. return 0;
  33. case MSM_PARAM_GMEM_SIZE:
  34. *value = adreno_gpu->gmem;
  35. return 0;
  36. case MSM_PARAM_GMEM_BASE:
  37. *value = 0x100000;
  38. return 0;
  39. case MSM_PARAM_CHIP_ID:
  40. *value = adreno_gpu->rev.patchid |
  41. (adreno_gpu->rev.minor << 8) |
  42. (adreno_gpu->rev.major << 16) |
  43. (adreno_gpu->rev.core << 24);
  44. return 0;
  45. case MSM_PARAM_MAX_FREQ:
  46. *value = adreno_gpu->base.fast_rate;
  47. return 0;
  48. case MSM_PARAM_TIMESTAMP:
  49. if (adreno_gpu->funcs->get_timestamp) {
  50. int ret;
  51. pm_runtime_get_sync(&gpu->pdev->dev);
  52. ret = adreno_gpu->funcs->get_timestamp(gpu, value);
  53. pm_runtime_put_autosuspend(&gpu->pdev->dev);
  54. return ret;
  55. }
  56. return -EINVAL;
  57. case MSM_PARAM_NR_RINGS:
  58. *value = gpu->nr_rings;
  59. return 0;
  60. default:
  61. DBG("%s: invalid param: %u", gpu->name, param);
  62. return -EINVAL;
  63. }
  64. }
  65. const struct firmware *
  66. adreno_request_fw(struct adreno_gpu *adreno_gpu, const char *fwname)
  67. {
  68. struct drm_device *drm = adreno_gpu->base.dev;
  69. const struct firmware *fw = NULL;
  70. char *newname;
  71. int ret;
  72. newname = kasprintf(GFP_KERNEL, "qcom/%s", fwname);
  73. if (!newname)
  74. return ERR_PTR(-ENOMEM);
  75. /*
  76. * Try first to load from qcom/$fwfile using a direct load (to avoid
  77. * a potential timeout waiting for usermode helper)
  78. */
  79. if ((adreno_gpu->fwloc == FW_LOCATION_UNKNOWN) ||
  80. (adreno_gpu->fwloc == FW_LOCATION_NEW)) {
  81. ret = request_firmware_direct(&fw, newname, drm->dev);
  82. if (!ret) {
  83. dev_info(drm->dev, "loaded %s from new location\n",
  84. newname);
  85. adreno_gpu->fwloc = FW_LOCATION_NEW;
  86. goto out;
  87. } else if (adreno_gpu->fwloc != FW_LOCATION_UNKNOWN) {
  88. dev_err(drm->dev, "failed to load %s: %d\n",
  89. newname, ret);
  90. fw = ERR_PTR(ret);
  91. goto out;
  92. }
  93. }
  94. /*
  95. * Then try the legacy location without qcom/ prefix
  96. */
  97. if ((adreno_gpu->fwloc == FW_LOCATION_UNKNOWN) ||
  98. (adreno_gpu->fwloc == FW_LOCATION_LEGACY)) {
  99. ret = request_firmware_direct(&fw, fwname, drm->dev);
  100. if (!ret) {
  101. dev_info(drm->dev, "loaded %s from legacy location\n",
  102. newname);
  103. adreno_gpu->fwloc = FW_LOCATION_LEGACY;
  104. goto out;
  105. } else if (adreno_gpu->fwloc != FW_LOCATION_UNKNOWN) {
  106. dev_err(drm->dev, "failed to load %s: %d\n",
  107. fwname, ret);
  108. fw = ERR_PTR(ret);
  109. goto out;
  110. }
  111. }
  112. /*
  113. * Finally fall back to request_firmware() for cases where the
  114. * usermode helper is needed (I think mainly android)
  115. */
  116. if ((adreno_gpu->fwloc == FW_LOCATION_UNKNOWN) ||
  117. (adreno_gpu->fwloc == FW_LOCATION_HELPER)) {
  118. ret = request_firmware(&fw, newname, drm->dev);
  119. if (!ret) {
  120. dev_info(drm->dev, "loaded %s with helper\n",
  121. newname);
  122. adreno_gpu->fwloc = FW_LOCATION_HELPER;
  123. goto out;
  124. } else if (adreno_gpu->fwloc != FW_LOCATION_UNKNOWN) {
  125. dev_err(drm->dev, "failed to load %s: %d\n",
  126. newname, ret);
  127. fw = ERR_PTR(ret);
  128. goto out;
  129. }
  130. }
  131. dev_err(drm->dev, "failed to load %s\n", fwname);
  132. fw = ERR_PTR(-ENOENT);
  133. out:
  134. kfree(newname);
  135. return fw;
  136. }
  137. int adreno_load_fw(struct adreno_gpu *adreno_gpu)
  138. {
  139. int i;
  140. for (i = 0; i < ARRAY_SIZE(adreno_gpu->info->fw); i++) {
  141. const struct firmware *fw;
  142. if (!adreno_gpu->info->fw[i])
  143. continue;
  144. /* Skip if the firmware has already been loaded */
  145. if (adreno_gpu->fw[i])
  146. continue;
  147. fw = adreno_request_fw(adreno_gpu, adreno_gpu->info->fw[i]);
  148. if (IS_ERR(fw))
  149. return PTR_ERR(fw);
  150. adreno_gpu->fw[i] = fw;
  151. }
  152. return 0;
  153. }
  154. struct drm_gem_object *adreno_fw_create_bo(struct msm_gpu *gpu,
  155. const struct firmware *fw, u64 *iova)
  156. {
  157. struct drm_gem_object *bo;
  158. void *ptr;
  159. ptr = msm_gem_kernel_new_locked(gpu->dev, fw->size - 4,
  160. MSM_BO_UNCACHED | MSM_BO_GPU_READONLY, gpu->aspace, &bo, iova);
  161. if (IS_ERR(ptr))
  162. return ERR_CAST(ptr);
  163. memcpy(ptr, &fw->data[4], fw->size - 4);
  164. msm_gem_put_vaddr(bo);
  165. return bo;
  166. }
  167. int adreno_hw_init(struct msm_gpu *gpu)
  168. {
  169. struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
  170. int ret, i;
  171. DBG("%s", gpu->name);
  172. ret = adreno_load_fw(adreno_gpu);
  173. if (ret)
  174. return ret;
  175. for (i = 0; i < gpu->nr_rings; i++) {
  176. struct msm_ringbuffer *ring = gpu->rb[i];
  177. if (!ring)
  178. continue;
  179. ret = msm_gem_get_iova(ring->bo, gpu->aspace, &ring->iova);
  180. if (ret) {
  181. ring->iova = 0;
  182. dev_err(gpu->dev->dev,
  183. "could not map ringbuffer %d: %d\n", i, ret);
  184. return ret;
  185. }
  186. ring->cur = ring->start;
  187. ring->next = ring->start;
  188. /* reset completed fence seqno: */
  189. ring->memptrs->fence = ring->seqno;
  190. ring->memptrs->rptr = 0;
  191. }
  192. /*
  193. * Setup REG_CP_RB_CNTL. The same value is used across targets (with
  194. * the excpetion of A430 that disables the RPTR shadow) - the cacluation
  195. * for the ringbuffer size and block size is moved to msm_gpu.h for the
  196. * pre-processor to deal with and the A430 variant is ORed in here
  197. */
  198. adreno_gpu_write(adreno_gpu, REG_ADRENO_CP_RB_CNTL,
  199. MSM_GPU_RB_CNTL_DEFAULT |
  200. (adreno_is_a430(adreno_gpu) ? AXXX_CP_RB_CNTL_NO_UPDATE : 0));
  201. /* Setup ringbuffer address - use ringbuffer[0] for GPU init */
  202. adreno_gpu_write64(adreno_gpu, REG_ADRENO_CP_RB_BASE,
  203. REG_ADRENO_CP_RB_BASE_HI, gpu->rb[0]->iova);
  204. if (!adreno_is_a430(adreno_gpu)) {
  205. adreno_gpu_write64(adreno_gpu, REG_ADRENO_CP_RB_RPTR_ADDR,
  206. REG_ADRENO_CP_RB_RPTR_ADDR_HI,
  207. rbmemptr(gpu->rb[0], rptr));
  208. }
  209. return 0;
  210. }
  211. /* Use this helper to read rptr, since a430 doesn't update rptr in memory */
  212. static uint32_t get_rptr(struct adreno_gpu *adreno_gpu,
  213. struct msm_ringbuffer *ring)
  214. {
  215. if (adreno_is_a430(adreno_gpu))
  216. return ring->memptrs->rptr = adreno_gpu_read(
  217. adreno_gpu, REG_ADRENO_CP_RB_RPTR);
  218. else
  219. return ring->memptrs->rptr;
  220. }
  221. struct msm_ringbuffer *adreno_active_ring(struct msm_gpu *gpu)
  222. {
  223. return gpu->rb[0];
  224. }
  225. void adreno_recover(struct msm_gpu *gpu)
  226. {
  227. struct drm_device *dev = gpu->dev;
  228. int ret;
  229. // XXX pm-runtime?? we *need* the device to be off after this
  230. // so maybe continuing to call ->pm_suspend/resume() is better?
  231. gpu->funcs->pm_suspend(gpu);
  232. gpu->funcs->pm_resume(gpu);
  233. ret = msm_gpu_hw_init(gpu);
  234. if (ret) {
  235. dev_err(dev->dev, "gpu hw init failed: %d\n", ret);
  236. /* hmm, oh well? */
  237. }
  238. }
  239. void adreno_submit(struct msm_gpu *gpu, struct msm_gem_submit *submit,
  240. struct msm_file_private *ctx)
  241. {
  242. struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
  243. struct msm_drm_private *priv = gpu->dev->dev_private;
  244. struct msm_ringbuffer *ring = submit->ring;
  245. unsigned i;
  246. for (i = 0; i < submit->nr_cmds; i++) {
  247. switch (submit->cmd[i].type) {
  248. case MSM_SUBMIT_CMD_IB_TARGET_BUF:
  249. /* ignore IB-targets */
  250. break;
  251. case MSM_SUBMIT_CMD_CTX_RESTORE_BUF:
  252. /* ignore if there has not been a ctx switch: */
  253. if (priv->lastctx == ctx)
  254. break;
  255. case MSM_SUBMIT_CMD_BUF:
  256. OUT_PKT3(ring, adreno_is_a430(adreno_gpu) ?
  257. CP_INDIRECT_BUFFER_PFE : CP_INDIRECT_BUFFER_PFD, 2);
  258. OUT_RING(ring, lower_32_bits(submit->cmd[i].iova));
  259. OUT_RING(ring, submit->cmd[i].size);
  260. OUT_PKT2(ring);
  261. break;
  262. }
  263. }
  264. OUT_PKT0(ring, REG_AXXX_CP_SCRATCH_REG2, 1);
  265. OUT_RING(ring, submit->seqno);
  266. if (adreno_is_a3xx(adreno_gpu) || adreno_is_a4xx(adreno_gpu)) {
  267. /* Flush HLSQ lazy updates to make sure there is nothing
  268. * pending for indirect loads after the timestamp has
  269. * passed:
  270. */
  271. OUT_PKT3(ring, CP_EVENT_WRITE, 1);
  272. OUT_RING(ring, HLSQ_FLUSH);
  273. OUT_PKT3(ring, CP_WAIT_FOR_IDLE, 1);
  274. OUT_RING(ring, 0x00000000);
  275. }
  276. /* BIT(31) of CACHE_FLUSH_TS triggers CACHE_FLUSH_TS IRQ from GPU */
  277. OUT_PKT3(ring, CP_EVENT_WRITE, 3);
  278. OUT_RING(ring, CACHE_FLUSH_TS | BIT(31));
  279. OUT_RING(ring, rbmemptr(ring, fence));
  280. OUT_RING(ring, submit->seqno);
  281. #if 0
  282. if (adreno_is_a3xx(adreno_gpu)) {
  283. /* Dummy set-constant to trigger context rollover */
  284. OUT_PKT3(ring, CP_SET_CONSTANT, 2);
  285. OUT_RING(ring, CP_REG(REG_A3XX_HLSQ_CL_KERNEL_GROUP_X_REG));
  286. OUT_RING(ring, 0x00000000);
  287. }
  288. #endif
  289. gpu->funcs->flush(gpu, ring);
  290. }
  291. void adreno_flush(struct msm_gpu *gpu, struct msm_ringbuffer *ring)
  292. {
  293. struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
  294. uint32_t wptr;
  295. /* Copy the shadow to the actual register */
  296. ring->cur = ring->next;
  297. /*
  298. * Mask wptr value that we calculate to fit in the HW range. This is
  299. * to account for the possibility that the last command fit exactly into
  300. * the ringbuffer and rb->next hasn't wrapped to zero yet
  301. */
  302. wptr = get_wptr(ring);
  303. /* ensure writes to ringbuffer have hit system memory: */
  304. mb();
  305. adreno_gpu_write(adreno_gpu, REG_ADRENO_CP_RB_WPTR, wptr);
  306. }
  307. bool adreno_idle(struct msm_gpu *gpu, struct msm_ringbuffer *ring)
  308. {
  309. struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
  310. uint32_t wptr = get_wptr(ring);
  311. /* wait for CP to drain ringbuffer: */
  312. if (!spin_until(get_rptr(adreno_gpu, ring) == wptr))
  313. return true;
  314. /* TODO maybe we need to reset GPU here to recover from hang? */
  315. DRM_ERROR("%s: timeout waiting to drain ringbuffer %d rptr/wptr = %X/%X\n",
  316. gpu->name, ring->id, get_rptr(adreno_gpu, ring), wptr);
  317. return false;
  318. }
  319. int adreno_gpu_state_get(struct msm_gpu *gpu, struct msm_gpu_state *state)
  320. {
  321. struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
  322. int i, count = 0;
  323. kref_init(&state->ref);
  324. ktime_get_real_ts64(&state->time);
  325. for (i = 0; i < gpu->nr_rings; i++) {
  326. int size = 0, j;
  327. state->ring[i].fence = gpu->rb[i]->memptrs->fence;
  328. state->ring[i].iova = gpu->rb[i]->iova;
  329. state->ring[i].seqno = gpu->rb[i]->seqno;
  330. state->ring[i].rptr = get_rptr(adreno_gpu, gpu->rb[i]);
  331. state->ring[i].wptr = get_wptr(gpu->rb[i]);
  332. /* Copy at least 'wptr' dwords of the data */
  333. size = state->ring[i].wptr;
  334. /* After wptr find the last non zero dword to save space */
  335. for (j = state->ring[i].wptr; j < MSM_GPU_RINGBUFFER_SZ >> 2; j++)
  336. if (gpu->rb[i]->start[j])
  337. size = j + 1;
  338. if (size) {
  339. state->ring[i].data = kmalloc(size << 2, GFP_KERNEL);
  340. if (state->ring[i].data) {
  341. memcpy(state->ring[i].data, gpu->rb[i]->start, size << 2);
  342. state->ring[i].data_size = size << 2;
  343. }
  344. }
  345. }
  346. /* Count the number of registers */
  347. for (i = 0; adreno_gpu->registers[i] != ~0; i += 2)
  348. count += adreno_gpu->registers[i + 1] -
  349. adreno_gpu->registers[i] + 1;
  350. state->registers = kcalloc(count * 2, sizeof(u32), GFP_KERNEL);
  351. if (state->registers) {
  352. int pos = 0;
  353. for (i = 0; adreno_gpu->registers[i] != ~0; i += 2) {
  354. u32 start = adreno_gpu->registers[i];
  355. u32 end = adreno_gpu->registers[i + 1];
  356. u32 addr;
  357. for (addr = start; addr <= end; addr++) {
  358. state->registers[pos++] = addr;
  359. state->registers[pos++] = gpu_read(gpu, addr);
  360. }
  361. }
  362. state->nr_registers = count;
  363. }
  364. return 0;
  365. }
  366. void adreno_gpu_state_destroy(struct msm_gpu_state *state)
  367. {
  368. int i;
  369. for (i = 0; i < ARRAY_SIZE(state->ring); i++)
  370. kfree(state->ring[i].data);
  371. for (i = 0; state->bos && i < state->nr_bos; i++)
  372. kvfree(state->bos[i].data);
  373. kfree(state->bos);
  374. kfree(state->comm);
  375. kfree(state->cmd);
  376. kfree(state->registers);
  377. }
  378. static void adreno_gpu_state_kref_destroy(struct kref *kref)
  379. {
  380. struct msm_gpu_state *state = container_of(kref,
  381. struct msm_gpu_state, ref);
  382. adreno_gpu_state_destroy(state);
  383. kfree(state);
  384. }
  385. int adreno_gpu_state_put(struct msm_gpu_state *state)
  386. {
  387. if (IS_ERR_OR_NULL(state))
  388. return 1;
  389. return kref_put(&state->ref, adreno_gpu_state_kref_destroy);
  390. }
  391. #if defined(CONFIG_DEBUG_FS) || defined(CONFIG_DEV_COREDUMP)
  392. static void adreno_show_object(struct drm_printer *p, u32 *ptr, int len)
  393. {
  394. char out[ASCII85_BUFSZ];
  395. long l, datalen, i;
  396. if (!ptr || !len)
  397. return;
  398. /*
  399. * Only dump the non-zero part of the buffer - rarely will any data
  400. * completely fill the entire allocated size of the buffer
  401. */
  402. for (datalen = 0, i = 0; i < len >> 2; i++) {
  403. if (ptr[i])
  404. datalen = (i << 2) + 1;
  405. }
  406. /* Skip printing the object if it is empty */
  407. if (datalen == 0)
  408. return;
  409. l = ascii85_encode_len(datalen);
  410. drm_puts(p, " data: !!ascii85 |\n");
  411. drm_puts(p, " ");
  412. for (i = 0; i < l; i++)
  413. drm_puts(p, ascii85_encode(ptr[i], out));
  414. drm_puts(p, "\n");
  415. }
  416. void adreno_show(struct msm_gpu *gpu, struct msm_gpu_state *state,
  417. struct drm_printer *p)
  418. {
  419. struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
  420. int i;
  421. if (IS_ERR_OR_NULL(state))
  422. return;
  423. drm_printf(p, "revision: %d (%d.%d.%d.%d)\n",
  424. adreno_gpu->info->revn, adreno_gpu->rev.core,
  425. adreno_gpu->rev.major, adreno_gpu->rev.minor,
  426. adreno_gpu->rev.patchid);
  427. drm_printf(p, "rbbm-status: 0x%08x\n", state->rbbm_status);
  428. drm_puts(p, "ringbuffer:\n");
  429. for (i = 0; i < gpu->nr_rings; i++) {
  430. drm_printf(p, " - id: %d\n", i);
  431. drm_printf(p, " iova: 0x%016llx\n", state->ring[i].iova);
  432. drm_printf(p, " last-fence: %d\n", state->ring[i].seqno);
  433. drm_printf(p, " retired-fence: %d\n", state->ring[i].fence);
  434. drm_printf(p, " rptr: %d\n", state->ring[i].rptr);
  435. drm_printf(p, " wptr: %d\n", state->ring[i].wptr);
  436. drm_printf(p, " size: %d\n", MSM_GPU_RINGBUFFER_SZ);
  437. adreno_show_object(p, state->ring[i].data,
  438. state->ring[i].data_size);
  439. }
  440. if (state->bos) {
  441. drm_puts(p, "bos:\n");
  442. for (i = 0; i < state->nr_bos; i++) {
  443. drm_printf(p, " - iova: 0x%016llx\n",
  444. state->bos[i].iova);
  445. drm_printf(p, " size: %zd\n", state->bos[i].size);
  446. adreno_show_object(p, state->bos[i].data,
  447. state->bos[i].size);
  448. }
  449. }
  450. drm_puts(p, "registers:\n");
  451. for (i = 0; i < state->nr_registers; i++) {
  452. drm_printf(p, " - { offset: 0x%04x, value: 0x%08x }\n",
  453. state->registers[i * 2] << 2,
  454. state->registers[(i * 2) + 1]);
  455. }
  456. }
  457. #endif
  458. /* Dump common gpu status and scratch registers on any hang, to make
  459. * the hangcheck logs more useful. The scratch registers seem always
  460. * safe to read when GPU has hung (unlike some other regs, depending
  461. * on how the GPU hung), and they are useful to match up to cmdstream
  462. * dumps when debugging hangs:
  463. */
  464. void adreno_dump_info(struct msm_gpu *gpu)
  465. {
  466. struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
  467. int i;
  468. printk("revision: %d (%d.%d.%d.%d)\n",
  469. adreno_gpu->info->revn, adreno_gpu->rev.core,
  470. adreno_gpu->rev.major, adreno_gpu->rev.minor,
  471. adreno_gpu->rev.patchid);
  472. for (i = 0; i < gpu->nr_rings; i++) {
  473. struct msm_ringbuffer *ring = gpu->rb[i];
  474. printk("rb %d: fence: %d/%d\n", i,
  475. ring->memptrs->fence,
  476. ring->seqno);
  477. printk("rptr: %d\n", get_rptr(adreno_gpu, ring));
  478. printk("rb wptr: %d\n", get_wptr(ring));
  479. }
  480. }
  481. /* would be nice to not have to duplicate the _show() stuff with printk(): */
  482. void adreno_dump(struct msm_gpu *gpu)
  483. {
  484. struct adreno_gpu *adreno_gpu = to_adreno_gpu(gpu);
  485. int i;
  486. /* dump these out in a form that can be parsed by demsm: */
  487. printk("IO:region %s 00000000 00020000\n", gpu->name);
  488. for (i = 0; adreno_gpu->registers[i] != ~0; i += 2) {
  489. uint32_t start = adreno_gpu->registers[i];
  490. uint32_t end = adreno_gpu->registers[i+1];
  491. uint32_t addr;
  492. for (addr = start; addr <= end; addr++) {
  493. uint32_t val = gpu_read(gpu, addr);
  494. printk("IO:R %08x %08x\n", addr<<2, val);
  495. }
  496. }
  497. }
  498. static uint32_t ring_freewords(struct msm_ringbuffer *ring)
  499. {
  500. struct adreno_gpu *adreno_gpu = to_adreno_gpu(ring->gpu);
  501. uint32_t size = MSM_GPU_RINGBUFFER_SZ >> 2;
  502. /* Use ring->next to calculate free size */
  503. uint32_t wptr = ring->next - ring->start;
  504. uint32_t rptr = get_rptr(adreno_gpu, ring);
  505. return (rptr + (size - 1) - wptr) % size;
  506. }
  507. void adreno_wait_ring(struct msm_ringbuffer *ring, uint32_t ndwords)
  508. {
  509. if (spin_until(ring_freewords(ring) >= ndwords))
  510. DRM_DEV_ERROR(ring->gpu->dev->dev,
  511. "timeout waiting for space in ringbuffer %d\n",
  512. ring->id);
  513. }
  514. /* Get legacy powerlevels from qcom,gpu-pwrlevels and populate the opp table */
  515. static int adreno_get_legacy_pwrlevels(struct device *dev)
  516. {
  517. struct device_node *child, *node;
  518. int ret;
  519. node = of_get_compatible_child(dev->of_node, "qcom,gpu-pwrlevels");
  520. if (!node) {
  521. dev_err(dev, "Could not find the GPU powerlevels\n");
  522. return -ENXIO;
  523. }
  524. for_each_child_of_node(node, child) {
  525. unsigned int val;
  526. ret = of_property_read_u32(child, "qcom,gpu-freq", &val);
  527. if (ret)
  528. continue;
  529. /*
  530. * Skip the intentionally bogus clock value found at the bottom
  531. * of most legacy frequency tables
  532. */
  533. if (val != 27000000)
  534. dev_pm_opp_add(dev, val, 0);
  535. }
  536. of_node_put(node);
  537. return 0;
  538. }
  539. static int adreno_get_pwrlevels(struct device *dev,
  540. struct msm_gpu *gpu)
  541. {
  542. unsigned long freq = ULONG_MAX;
  543. struct dev_pm_opp *opp;
  544. int ret;
  545. gpu->fast_rate = 0;
  546. /* You down with OPP? */
  547. if (!of_find_property(dev->of_node, "operating-points-v2", NULL))
  548. ret = adreno_get_legacy_pwrlevels(dev);
  549. else {
  550. ret = dev_pm_opp_of_add_table(dev);
  551. if (ret)
  552. dev_err(dev, "Unable to set the OPP table\n");
  553. }
  554. if (!ret) {
  555. /* Find the fastest defined rate */
  556. opp = dev_pm_opp_find_freq_floor(dev, &freq);
  557. if (!IS_ERR(opp)) {
  558. gpu->fast_rate = freq;
  559. dev_pm_opp_put(opp);
  560. }
  561. }
  562. if (!gpu->fast_rate) {
  563. dev_warn(dev,
  564. "Could not find a clock rate. Using a reasonable default\n");
  565. /* Pick a suitably safe clock speed for any target */
  566. gpu->fast_rate = 200000000;
  567. }
  568. DBG("fast_rate=%u, slow_rate=27000000", gpu->fast_rate);
  569. return 0;
  570. }
  571. int adreno_gpu_init(struct drm_device *drm, struct platform_device *pdev,
  572. struct adreno_gpu *adreno_gpu,
  573. const struct adreno_gpu_funcs *funcs, int nr_rings)
  574. {
  575. struct adreno_platform_config *config = pdev->dev.platform_data;
  576. struct msm_gpu_config adreno_gpu_config = { 0 };
  577. struct msm_gpu *gpu = &adreno_gpu->base;
  578. adreno_gpu->funcs = funcs;
  579. adreno_gpu->info = adreno_info(config->rev);
  580. adreno_gpu->gmem = adreno_gpu->info->gmem;
  581. adreno_gpu->revn = adreno_gpu->info->revn;
  582. adreno_gpu->rev = config->rev;
  583. adreno_gpu_config.ioname = "kgsl_3d0_reg_memory";
  584. adreno_gpu_config.irqname = "kgsl_3d0_irq";
  585. adreno_gpu_config.va_start = SZ_16M;
  586. adreno_gpu_config.va_end = 0xffffffff;
  587. adreno_gpu_config.nr_rings = nr_rings;
  588. adreno_get_pwrlevels(&pdev->dev, gpu);
  589. pm_runtime_set_autosuspend_delay(&pdev->dev,
  590. adreno_gpu->info->inactive_period);
  591. pm_runtime_use_autosuspend(&pdev->dev);
  592. pm_runtime_enable(&pdev->dev);
  593. return msm_gpu_init(drm, pdev, &adreno_gpu->base, &funcs->base,
  594. adreno_gpu->info->name, &adreno_gpu_config);
  595. }
  596. void adreno_gpu_cleanup(struct adreno_gpu *adreno_gpu)
  597. {
  598. unsigned int i;
  599. for (i = 0; i < ARRAY_SIZE(adreno_gpu->info->fw); i++)
  600. release_firmware(adreno_gpu->fw[i]);
  601. msm_gpu_cleanup(&adreno_gpu->base);
  602. }