-
Notifications
You must be signed in to change notification settings - Fork 1.4k
/
UniversalHashingFamily.cs
126 lines (104 loc) · 4.85 KB
/
UniversalHashingFamily.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
/***
* Universal-Hashing Functions Family.
*
* Implements a class that represents a family of simple universal hash functions.
* Supports re-generation of functions.
* It depends on the Common/PrimesList helper class.
*
* This class is used in the Cuckoo Hash Table implementation.
*/
using System;
using DataStructures.Common;
namespace DataStructures.Hashing
{
/// <summary>
/// Implements a family of universal hash functions of the form
/// <c>h(x) = (a * x + b) mod BIG_PRIME</c>, where the multipliers <c>a</c> and <c>b</c>
/// of every member function are picked at random from the shared primes list.
/// </summary>
/// <remarks>
/// Member functions are addressed with a 1-based index (1 .. <see cref="NumberOfFunctions"/>).
/// Calling <see cref="GenerateNewFunctions"/> replaces the multipliers of every member function,
/// so hash values computed before and after that call are unrelated.
/// </remarks>
public class UniversalHashingFamily
{
    // A large prime, arbitrarily chosen
    // In decimal = 2,146,435,069;
    private const int BIG_PRIME = 0x7FEFFFFD;

    private static readonly PrimesList _primes = PrimesList.Instance;

    private readonly Random _randomizer;
    private readonly int _numberOfHashFunctions;

    // Multiplier "a" (first) and offset "b" (second) of each member function, indexed from zero.
    private readonly int[] _firstMultipliersVector;
    private readonly int[] _secondMultipliersVector;

    /// <summary>
    /// Initializes the family with a specified number of hash functions.
    /// </summary>
    /// <param name="numberOfHashFunctions">Number of member hash functions; must be greater than zero.</param>
    /// <exception cref="ArgumentOutOfRangeException">
    /// Thrown when <paramref name="numberOfHashFunctions"/> is zero or negative.
    /// </exception>
    public UniversalHashingFamily(int numberOfHashFunctions)
    {
        if (numberOfHashFunctions <= 0)
        {
            // The (paramName, message) overload is required: the single-string overload
            // would treat the text as the parameter name instead of the message.
            throw new ArgumentOutOfRangeException(
                "numberOfHashFunctions",
                "Number of hash functions should be greater than zero.");
        }

        _randomizer = new Random();
        _numberOfHashFunctions = numberOfHashFunctions;
        _firstMultipliersVector = new int[_numberOfHashFunctions];
        _secondMultipliersVector = new int[_numberOfHashFunctions];

        GenerateNewFunctions();
    }

    /// <summary>
    /// Returns number of member hash functions.
    /// </summary>
    public int NumberOfFunctions
    {
        get { return _numberOfHashFunctions; }
    }

    /// <summary>
    /// Generates new hash functions with new randomized multipliers.
    /// </summary>
    /// <remarks>
    /// For each member function the two multipliers are distinct values of the primes list
    /// that are smaller than <c>BIG_PRIME</c>.
    /// </remarks>
    public void GenerateNewFunctions()
    {
        for (int i = 0; i < _numberOfHashFunctions; i++)
        {
            int first = PickRandomMultiplier(null);

            // The second multiplier must differ from the first one.
            int second = PickRandomMultiplier(first);

            _firstMultipliersVector[i] = first;
            _secondMultipliersVector[i] = second;
        }
    }

    /// <summary>
    /// Returns the hash value of an integer pre-hash code, using the specified member hash function.
    /// </summary>
    /// <param name="preHashedKey">Int pre-hash code of an object.</param>
    /// <param name="whichHashFunction">1-based number of the hash function to use (1 .. <see cref="NumberOfFunctions"/>).</param>
    /// <returns>A value in the range <c>[0, BIG_PRIME)</c>.</returns>
    /// <exception cref="ArgumentOutOfRangeException">
    /// Thrown when <paramref name="whichHashFunction"/> is not in 1 .. <see cref="NumberOfFunctions"/>.
    /// </exception>
    public int UniversalHash(int preHashedKey, int whichHashFunction)
    {
        if (whichHashFunction <= 0 || whichHashFunction > _numberOfHashFunctions)
        {
            throw new ArgumentOutOfRangeException(
                "whichHashFunction",
                "WhichHashFunction parameter should be greater than zero and less than or equal to the number of Hash Functions.");
        }

        long a = _firstMultipliersVector[whichHashFunction - 1];
        long b = _secondMultipliersVector[whichHashFunction - 1];

        // Evaluate in 64 bits: both multipliers are below 2^31 and |preHashedKey| <= 2^31,
        // so a * x + b always fits in a long. In 32-bit arithmetic the product would wrap
        // (or throw in a checked build) and the result would no longer be (a*x + b) mod p.
        long hash = ((a * preHashedKey) + b) % BIG_PRIME;

        // C#'s % keeps the sign of the dividend; shift negative remainders into [0, BIG_PRIME).
        if (hash < 0)
        {
            hash += BIG_PRIME;
        }

        return (int)hash;
    }

    /// <summary>
    /// Returns hash value of a string, given the specified number of the hash function to use.
    /// </summary>
    /// <remarks>
    /// The string is first reduced to an integer pre-hash: the sum of every character code
    /// XOR-ed with <c>key.Length - 1</c>. That sum does not depend on character order, so
    /// strings that are permutations of each other produce the same hash value.
    /// </remarks>
    /// <param name="key">string key; must not be null or empty.</param>
    /// <param name="whichHashFunction">1-based number of the hash function to use (1 .. <see cref="NumberOfFunctions"/>).</param>
    /// <returns>A value in the range <c>[0, BIG_PRIME)</c>.</returns>
    /// <exception cref="ArgumentException">Thrown when <paramref name="key"/> is null or empty.</exception>
    /// <exception cref="ArgumentOutOfRangeException">
    /// Thrown when <paramref name="whichHashFunction"/> is not in 1 .. <see cref="NumberOfFunctions"/>.
    /// </exception>
    public int UniversalHash(string key, int whichHashFunction)
    {
        if (string.IsNullOrEmpty(key))
        {
            throw new ArgumentException("Key is either an empty string or null.", "key");
        }

        int lengthMask = key.Length - 1;
        int prehash = 0;

        // Wrap-around is acceptable for a pre-hash; "unchecked" keeps very long keys from
        // throwing OverflowException when the project is compiled with overflow checking.
        unchecked
        {
            foreach (char character in key)
            {
                prehash += character ^ lengthMask;
            }
        }

        return UniversalHash(prehash, whichHashFunction);
    }

    /// <summary>
    /// Draws random entries of the primes list until one is smaller than <c>BIG_PRIME</c>
    /// and different from <paramref name="excluded"/> (when a value is given).
    /// </summary>
    private int PickRandomMultiplier(int? excluded)
    {
        int candidate;

        do
        {
            // Random.Next(min, max) never returns max, so passing Count makes every index
            // 0 .. Count - 1 selectable.
            // NOTE(review): assumes index Count - 1 is valid for the PrimesList indexer - confirm.
            candidate = _primes[_randomizer.Next(0, _primes.Count)];
        }
        while (candidate >= BIG_PRIME || (excluded.HasValue && candidate == excluded.Value));

        return candidate;
    }
}
}