/* ===-- popcountdi2.c - Implement __popcountdi2 ----------------------------===
 *
 *                     The LLVM Compiler Infrastructure
 *
 * This file is dual licensed under the MIT and the University of Illinois Open
 * Source Licenses. See LICENSE.TXT for details.
 *
 * ===----------------------------------------------------------------------===
 *
 * This file implements __popcountdi2 for the compiler_rt library.
 *
 * ===----------------------------------------------------------------------===
 */
| Anton Korobeynikov | 1c5f89b | 2011-04-19 17:52:09 +0000 | [diff] [blame^] | 14 | #include "abi.h" |
| Daniel Dunbar | b3a6901 | 2009-06-26 16:47:03 +0000 | [diff] [blame] | 15 | |
| 16 | #include "int_lib.h" |
| 17 | |
| Edward O'Callaghan | 1fcb40b | 2009-08-05 19:06:50 +0000 | [diff] [blame] | 18 | /* Returns: count of 1 bits */ |
| Daniel Dunbar | b3a6901 | 2009-06-26 16:47:03 +0000 | [diff] [blame] | 19 | |
| Anton Korobeynikov | 1c5f89b | 2011-04-19 17:52:09 +0000 | [diff] [blame^] | 20 | COMPILER_RT_ABI si_int |
| Daniel Dunbar | b3a6901 | 2009-06-26 16:47:03 +0000 | [diff] [blame] | 21 | __popcountdi2(di_int a) |
| 22 | { |
| 23 | du_int x2 = (du_int)a; |
| 24 | x2 = x2 - ((x2 >> 1) & 0x5555555555555555uLL); |
| Edward O'Callaghan | 1fcb40b | 2009-08-05 19:06:50 +0000 | [diff] [blame] | 25 | /* Every 2 bits holds the sum of every pair of bits (32) */ |
| Daniel Dunbar | b3a6901 | 2009-06-26 16:47:03 +0000 | [diff] [blame] | 26 | x2 = ((x2 >> 2) & 0x3333333333333333uLL) + (x2 & 0x3333333333333333uLL); |
| Edward O'Callaghan | 1fcb40b | 2009-08-05 19:06:50 +0000 | [diff] [blame] | 27 | /* Every 4 bits holds the sum of every 4-set of bits (3 significant bits) (16) */ |
| Daniel Dunbar | b3a6901 | 2009-06-26 16:47:03 +0000 | [diff] [blame] | 28 | x2 = (x2 + (x2 >> 4)) & 0x0F0F0F0F0F0F0F0FuLL; |
| Edward O'Callaghan | 1fcb40b | 2009-08-05 19:06:50 +0000 | [diff] [blame] | 29 | /* Every 8 bits holds the sum of every 8-set of bits (4 significant bits) (8) */ |
| Daniel Dunbar | b3a6901 | 2009-06-26 16:47:03 +0000 | [diff] [blame] | 30 | su_int x = (su_int)(x2 + (x2 >> 32)); |
| Edward O'Callaghan | 1fcb40b | 2009-08-05 19:06:50 +0000 | [diff] [blame] | 31 | /* The lower 32 bits hold four 16 bit sums (5 significant bits). */ |
| 32 | /* Upper 32 bits are garbage */ |
| Daniel Dunbar | b3a6901 | 2009-06-26 16:47:03 +0000 | [diff] [blame] | 33 | x = x + (x >> 16); |
| Edward O'Callaghan | 1fcb40b | 2009-08-05 19:06:50 +0000 | [diff] [blame] | 34 | /* The lower 16 bits hold two 32 bit sums (6 significant bits). */ |
| 35 | /* Upper 16 bits are garbage */ |
| 36 | return (x + (x >> 8)) & 0x0000007F; /* (7 significant bits) */ |
| Daniel Dunbar | b3a6901 | 2009-06-26 16:47:03 +0000 | [diff] [blame] | 37 | } |