mirror of https://github.com/apache/druid.git
GroupBy v2: Improve hash code distribution. (#3407)
Without this transformation, distribution of hash % X is poor in general. It is catastrophically poor when X is a multiple of 31 (many slots would be empty).
This commit is contained in:
parent
f037dfcaa4
commit
b11e9544ea
|
@ -46,7 +46,9 @@ public class Groupers
|
||||||
public static int hash(final Object obj)
|
public static int hash(final Object obj)
|
||||||
{
|
{
|
||||||
// Mask off the high bit so we can use that to determine if a bucket is used or not.
|
// Mask off the high bit so we can use that to determine if a bucket is used or not.
|
||||||
return obj.hashCode() & 0x7fffffff;
|
// Also apply the same XOR transformation that j.u.HashMap applies, to improve distribution.
|
||||||
|
final int code = obj.hashCode();
|
||||||
|
return (code ^ (code >>> 16)) & 0x7fffffff;
|
||||||
}
|
}
|
||||||
|
|
||||||
public static <KeyType extends Comparable<KeyType>> Iterator<Grouper.Entry<KeyType>> mergeIterators(
|
public static <KeyType extends Comparable<KeyType>> Iterator<Grouper.Entry<KeyType>> mergeIterators(
|
||||||
|
|
Loading…
Reference in New Issue