gp100.c 6.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182
  1. /*
  2. * Copyright 2016 Red Hat Inc.
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  17. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20. * OTHER DEALINGS IN THE SOFTWARE.
  21. *
  22. * Authors: Ben Skeggs <bskeggs@redhat.com>
  23. */
  24. #include "gf100.h"
  25. #include "ctxgf100.h"
  26. #include <nvif/class.h>
  27. /*******************************************************************************
  28. * PGRAPH engine/subdev functions
  29. ******************************************************************************/
  30. void
  31. gp100_gr_init_rop_active_fbps(struct gf100_gr *gr)
  32. {
  33. struct nvkm_device *device = gr->base.engine.subdev.device;
  34. /*XXX: otherwise identical to gm200 aside from mask.. do everywhere? */
  35. const u32 fbp_count = nvkm_rd32(device, 0x12006c) & 0x0000000f;
  36. nvkm_mask(device, 0x408850, 0x0000000f, fbp_count); /* zrop */
  37. nvkm_mask(device, 0x408958, 0x0000000f, fbp_count); /* crop */
  38. }
  39. void
  40. gp100_gr_init_num_active_ltcs(struct gf100_gr *gr)
  41. {
  42. struct nvkm_device *device = gr->base.engine.subdev.device;
  43. nvkm_wr32(device, GPC_BCAST(0x08ac), nvkm_rd32(device, 0x100800));
  44. nvkm_wr32(device, GPC_BCAST(0x033c), nvkm_rd32(device, 0x100804));
  45. }
  46. int
  47. gp100_gr_init(struct gf100_gr *gr)
  48. {
  49. struct nvkm_device *device = gr->base.engine.subdev.device;
  50. const u32 magicgpc918 = DIV_ROUND_UP(0x00800000, gr->tpc_total);
  51. u32 data[TPC_MAX / 8] = {};
  52. u8 tpcnr[GPC_MAX];
  53. int gpc, tpc, rop;
  54. int i;
  55. gr->func->init_gpc_mmu(gr);
  56. gf100_gr_mmio(gr, gr->fuc_sw_nonctx);
  57. nvkm_wr32(device, GPC_UNIT(0, 0x3018), 0x00000001);
  58. memset(data, 0x00, sizeof(data));
  59. memcpy(tpcnr, gr->tpc_nr, sizeof(gr->tpc_nr));
  60. for (i = 0, gpc = -1; i < gr->tpc_total; i++) {
  61. do {
  62. gpc = (gpc + 1) % gr->gpc_nr;
  63. } while (!tpcnr[gpc]);
  64. tpc = gr->tpc_nr[gpc] - tpcnr[gpc]--;
  65. data[i / 8] |= tpc << ((i % 8) * 4);
  66. }
  67. nvkm_wr32(device, GPC_BCAST(0x0980), data[0]);
  68. nvkm_wr32(device, GPC_BCAST(0x0984), data[1]);
  69. nvkm_wr32(device, GPC_BCAST(0x0988), data[2]);
  70. nvkm_wr32(device, GPC_BCAST(0x098c), data[3]);
  71. for (gpc = 0; gpc < gr->gpc_nr; gpc++) {
  72. nvkm_wr32(device, GPC_UNIT(gpc, 0x0914),
  73. gr->screen_tile_row_offset << 8 | gr->tpc_nr[gpc]);
  74. nvkm_wr32(device, GPC_UNIT(gpc, 0x0910), 0x00040000 |
  75. gr->tpc_total);
  76. nvkm_wr32(device, GPC_UNIT(gpc, 0x0918), magicgpc918);
  77. }
  78. nvkm_wr32(device, GPC_BCAST(0x3fd4), magicgpc918);
  79. gr->func->init_num_active_ltcs(gr);
  80. gr->func->init_rop_active_fbps(gr);
  81. if (gr->func->init_swdx_pes_mask)
  82. gr->func->init_swdx_pes_mask(gr);
  83. nvkm_wr32(device, 0x400500, 0x00010001);
  84. nvkm_wr32(device, 0x400100, 0xffffffff);
  85. nvkm_wr32(device, 0x40013c, 0xffffffff);
  86. nvkm_wr32(device, 0x400124, 0x00000002);
  87. nvkm_wr32(device, 0x409c24, 0x000f0002);
  88. nvkm_wr32(device, 0x405848, 0xc0000000);
  89. nvkm_mask(device, 0x40584c, 0x00000000, 0x00000001);
  90. nvkm_wr32(device, 0x404000, 0xc0000000);
  91. nvkm_wr32(device, 0x404600, 0xc0000000);
  92. nvkm_wr32(device, 0x408030, 0xc0000000);
  93. nvkm_wr32(device, 0x404490, 0xc0000000);
  94. nvkm_wr32(device, 0x406018, 0xc0000000);
  95. nvkm_wr32(device, 0x407020, 0x40000000);
  96. nvkm_wr32(device, 0x405840, 0xc0000000);
  97. nvkm_wr32(device, 0x405844, 0x00ffffff);
  98. nvkm_mask(device, 0x419cc0, 0x00000008, 0x00000008);
  99. nvkm_mask(device, 0x419c9c, 0x00010000, 0x00010000);
  100. nvkm_mask(device, 0x419c9c, 0x00020000, 0x00020000);
  101. gr->func->init_ppc_exceptions(gr);
  102. for (gpc = 0; gpc < gr->gpc_nr; gpc++) {
  103. nvkm_wr32(device, GPC_UNIT(gpc, 0x0420), 0xc0000000);
  104. nvkm_wr32(device, GPC_UNIT(gpc, 0x0900), 0xc0000000);
  105. nvkm_wr32(device, GPC_UNIT(gpc, 0x1028), 0xc0000000);
  106. nvkm_wr32(device, GPC_UNIT(gpc, 0x0824), 0xc0000000);
  107. for (tpc = 0; tpc < gr->tpc_nr[gpc]; tpc++) {
  108. nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x508), 0xffffffff);
  109. nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x50c), 0xffffffff);
  110. nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x224), 0xc0000000);
  111. nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x48c), 0xc0000000);
  112. nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x084), 0xc0000000);
  113. nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x430), 0xc0000000);
  114. nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x644), 0x00dffffe);
  115. nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x64c), 0x00000105);
  116. }
  117. nvkm_wr32(device, GPC_UNIT(gpc, 0x2c90), 0xffffffff);
  118. nvkm_wr32(device, GPC_UNIT(gpc, 0x2c94), 0xffffffff);
  119. }
  120. for (rop = 0; rop < gr->rop_nr; rop++) {
  121. nvkm_wr32(device, ROP_UNIT(rop, 0x144), 0x40000000);
  122. nvkm_wr32(device, ROP_UNIT(rop, 0x070), 0x40000000);
  123. nvkm_wr32(device, ROP_UNIT(rop, 0x204), 0xffffffff);
  124. nvkm_wr32(device, ROP_UNIT(rop, 0x208), 0xffffffff);
  125. }
  126. nvkm_wr32(device, 0x400108, 0xffffffff);
  127. nvkm_wr32(device, 0x400138, 0xffffffff);
  128. nvkm_wr32(device, 0x400118, 0xffffffff);
  129. nvkm_wr32(device, 0x400130, 0xffffffff);
  130. nvkm_wr32(device, 0x40011c, 0xffffffff);
  131. nvkm_wr32(device, 0x400134, 0xffffffff);
  132. gf100_gr_zbc_init(gr);
  133. return gf100_gr_init_ctxctl(gr);
  134. }
  135. static const struct gf100_gr_func
  136. gp100_gr = {
  137. .init = gp100_gr_init,
  138. .init_gpc_mmu = gm200_gr_init_gpc_mmu,
  139. .init_rop_active_fbps = gp100_gr_init_rop_active_fbps,
  140. .init_ppc_exceptions = gk104_gr_init_ppc_exceptions,
  141. .init_num_active_ltcs = gp100_gr_init_num_active_ltcs,
  142. .rops = gm200_gr_rops,
  143. .ppc_nr = 2,
  144. .grctx = &gp100_grctx,
  145. .sclass = {
  146. { -1, -1, FERMI_TWOD_A },
  147. { -1, -1, KEPLER_INLINE_TO_MEMORY_B },
  148. { -1, -1, PASCAL_A, &gf100_fermi },
  149. { -1, -1, PASCAL_COMPUTE_A },
  150. {}
  151. }
  152. };
  153. int
  154. gp100_gr_new(struct nvkm_device *device, int index, struct nvkm_gr **pgr)
  155. {
  156. return gm200_gr_new_(&gp100_gr, device, index, pgr);
  157. }