hweight_64.S 2.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116
  1. /*
  2. * This program is free software; you can redistribute it and/or modify
  3. * it under the terms of the GNU General Public License as published by
  4. * the Free Software Foundation; either version 2 of the License, or
  5. * (at your option) any later version.
  6. *
  7. * This program is distributed in the hope that it will be useful,
  8. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  9. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  10. * GNU General Public License for more details.
  11. *
  12. * You should have received a copy of the GNU General Public License
  13. * along with this program; if not, write to the Free Software
  14. * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
  15. *
  16. * Copyright (C) IBM Corporation, 2010
  17. *
  18. * Author: Anton Blanchard <anton@au.ibm.com>
  19. */
  20. #include <asm/processor.h>
  21. #include <asm/ppc_asm.h>
  22. #include <asm/export.h>
  23. #include <asm/feature-fixups.h>
  24. /* Note: This code relies on -mminimal-toc */
  25. _GLOBAL(__arch_hweight8)
  26. BEGIN_FTR_SECTION
  27. b __sw_hweight8
  28. nop
  29. nop
  30. FTR_SECTION_ELSE
  31. PPC_POPCNTB(R3,R3)
  32. clrldi r3,r3,64-8
  33. blr
  34. ALT_FTR_SECTION_END_IFCLR(CPU_FTR_POPCNTB)
  35. EXPORT_SYMBOL(__arch_hweight8)
  36. _GLOBAL(__arch_hweight16)
  37. BEGIN_FTR_SECTION
  38. b __sw_hweight16
  39. nop
  40. nop
  41. nop
  42. nop
  43. FTR_SECTION_ELSE
  44. BEGIN_FTR_SECTION_NESTED(50)
  45. PPC_POPCNTB(R3,R3)
  46. srdi r4,r3,8
  47. add r3,r4,r3
  48. clrldi r3,r3,64-8
  49. blr
  50. FTR_SECTION_ELSE_NESTED(50)
  51. clrlwi r3,r3,16
  52. PPC_POPCNTW(R3,R3)
  53. clrldi r3,r3,64-8
  54. blr
  55. ALT_FTR_SECTION_END_NESTED_IFCLR(CPU_FTR_POPCNTD, 50)
  56. ALT_FTR_SECTION_END_IFCLR(CPU_FTR_POPCNTB)
  57. EXPORT_SYMBOL(__arch_hweight16)
  58. _GLOBAL(__arch_hweight32)
  59. BEGIN_FTR_SECTION
  60. b __sw_hweight32
  61. nop
  62. nop
  63. nop
  64. nop
  65. nop
  66. nop
  67. FTR_SECTION_ELSE
  68. BEGIN_FTR_SECTION_NESTED(51)
  69. PPC_POPCNTB(R3,R3)
  70. srdi r4,r3,16
  71. add r3,r4,r3
  72. srdi r4,r3,8
  73. add r3,r4,r3
  74. clrldi r3,r3,64-8
  75. blr
  76. FTR_SECTION_ELSE_NESTED(51)
  77. PPC_POPCNTW(R3,R3)
  78. clrldi r3,r3,64-8
  79. blr
  80. ALT_FTR_SECTION_END_NESTED_IFCLR(CPU_FTR_POPCNTD, 51)
  81. ALT_FTR_SECTION_END_IFCLR(CPU_FTR_POPCNTB)
  82. EXPORT_SYMBOL(__arch_hweight32)
  83. _GLOBAL(__arch_hweight64)
  84. BEGIN_FTR_SECTION
  85. b __sw_hweight64
  86. nop
  87. nop
  88. nop
  89. nop
  90. nop
  91. nop
  92. nop
  93. nop
  94. FTR_SECTION_ELSE
  95. BEGIN_FTR_SECTION_NESTED(52)
  96. PPC_POPCNTB(R3,R3)
  97. srdi r4,r3,32
  98. add r3,r4,r3
  99. srdi r4,r3,16
  100. add r3,r4,r3
  101. srdi r4,r3,8
  102. add r3,r4,r3
  103. clrldi r3,r3,64-8
  104. blr
  105. FTR_SECTION_ELSE_NESTED(52)
  106. PPC_POPCNTD(R3,R3)
  107. clrldi r3,r3,64-8
  108. blr
  109. ALT_FTR_SECTION_END_NESTED_IFCLR(CPU_FTR_POPCNTD, 52)
  110. ALT_FTR_SECTION_END_IFCLR(CPU_FTR_POPCNTB)
  111. EXPORT_SYMBOL(__arch_hweight64)