-
Notifications
You must be signed in to change notification settings - Fork 25
/
Copy pathLSH_helpers.cpp
206 lines (182 loc) · 7.52 KB
/
LSH_helpers.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
#include "LSH.h"
#ifndef INT_MAX
#define INT_MAX 0xffffffff
#endif
//#define PROFILE_READ
typedef std::chrono::high_resolution_clock Clock;
void LSH::getOptimalMinhash(unsigned int *hashIndices, unsigned int *probeDataIdx, int *dataIdx, int *dataMarker, int numInputEntries, int numProbes) {
#if defined DEBUG
std::cout << "[LSH::getOptimalMinhash]" << std::endl;
#endif
#ifdef PROFILE_READ
auto begin = Clock::now();
#endif
#ifndef DEBUG
#pragma omp parallel for
#endif
for (int inputIdx = 0; inputIdx < numInputEntries; inputIdx++) {
#if defined DEBUG
std::cout << "inputIdx " << inputIdx << std::endl;
#endif
unsigned int *hashes = new unsigned int[_numhashes];
int sizenonzeros = dataMarker[inputIdx + 1] - dataMarker[inputIdx];
#if defined DEBUG
if (sizenonzeros > MAGIC_NUMBER || sizenonzeros < 0) {
std::cout << "[LSH::getOptimalMinhash] sizenonzeros = " << sizenonzeros << " (" <<
dataMarker[inputIdx] << "," << dataMarker[inputIdx + 1] << ")" << std::endl;
}
std::cout << "Entering optimalMinHash()" << std::endl;
#endif
optimalMinHash(hashes, (unsigned int*)(dataIdx + dataMarker[inputIdx]), sizenonzeros);
#if defined DEBUG
std::cout << "Exit optimalMinHash()" << std::endl;
#endif
for (int tb = 0; tb < _L; tb++)
{
unsigned int index = 0;
for (int k = 0; k < _K; k++)
{
unsigned int h = hashes[_K*tb + k];
h *= rand1[_K * tb + k];
h ^= h >> 13;
h ^= rand1[_K * tb + k];
index += h*hashes[_K * tb + k];
}
index = (index << 2) >> (32 - _rangePow);
#if defined DEBUG
unsigned long long allHashesIdxVerify =
hashIndicesOutputIdx(_L, numProbes, numInputEntries, inputIdx, 0, tb);
if (allHashesIdxVerify < 0 || allHashesIdxVerify > (numInputEntries * numProbes * _L)) {
std::cout << "AllHErr!" << allHashesIdxVerify << std::endl;
}
#endif
hashIndices[hashIndicesOutputIdx(_L, numProbes, numInputEntries, inputIdx, 0, tb)] = index;
probeDataIdx[hashIndicesOutputIdx(_L, numProbes, numInputEntries, inputIdx, 0, tb)] = inputIdx;
for (int k = 1; k < numProbes; k++) {
hashIndices[hashIndicesOutputIdx(_L, numProbes, numInputEntries, inputIdx, k, tb)] = index ^ (1 << (k - 1));
probeDataIdx[hashIndicesOutputIdx(_L, numProbes, numInputEntries, inputIdx, k, tb)] = inputIdx;
}
}
delete[] hashes;
}
#ifdef PROFILE_READ
auto end = Clock::now();
float etime = (end - begin).count() / (float)1000000;
printf("[LSH::getOptimalMinhash(OpenMP)] Computation %5.3f ms\n", etime);
#endif
#if defined DEBUG
std::cout << "[LSH::getOptimalMinhash] Exit. " << std::endl;
#endif
}
// The range of hashes returned by getRandDoubleHash is 2^_lognumhash = numhash.
unsigned int LSH::getRandDoubleHash(int binid, int count) {
unsigned int tohash = ((binid + 1) << 10) + count;
return ((unsigned int)_randHash[0] * tohash << 3) >> (32 - _lognumhash); // _lognumhash needs to be ceiled.
}
void LSH::optimalMinHash(unsigned int *hashArray, unsigned int *nonZeros, int sizenonzeros) {
/* This function computes the minhash and perform densification. */
unsigned int *hashes = new unsigned int[_numhashes];
unsigned int range = 1 << _rangePow;
// binsize is the number of times the range is larger than the total number of hashes we need.
unsigned int binsize = ceil(range / _numhashes);
for (size_t i = 0; i < _numhashes; i++)
{
hashes[i] = INT_MAX;
}
#if defined DEBUG
std::cout << "[optimalMinHash] Minhashing. " << sizenonzeros << " nonzeros" <<
". First " << nonZeros[0] << std::endl;
if (sizenonzeros > MAGIC_NUMBER || sizenonzeros < 0) return;
#endif
for (size_t i = 0; i < sizenonzeros; i++)
{
unsigned int h = nonZeros[i];
h *= _randa;
h ^= h >> 13;
h *= 0x85ebca6b;
unsigned int curhash = ((unsigned int)(((unsigned int)h*nonZeros[i]) << 5) >> (32 - _rangePow));
unsigned int binid = std::min((unsigned int) floor(curhash / binsize), (unsigned int)(_numhashes - 1));
if (hashes[binid] > curhash)
hashes[binid] = curhash;
}
#if defined DEBUG
std::cout << "[optimalMinHash] Densification. " << std::endl;
#endif
/* Densification of the hash. */
for (size_t i = 0; i < _numhashes; i++)
{
unsigned int next = hashes[i];
if (next != INT_MAX)
{
hashArray[i] = hashes[i];
continue;
}
unsigned int count = 0;
while (next == INT_MAX)
{
count++;
unsigned int index = std::min(
(unsigned)getRandDoubleHash((unsigned int)i, count),
(unsigned)_numhashes);
next = hashes[index]; // Kills GPU.
if (count > 100) // Densification failure.
break;
}
hashArray[i] = next;
}
delete[] hashes;
#if defined DEBUG
std::cout << "[optimalMinHash] Exit. " << std::endl;
#endif
}
void LSH::srp_openmp_sparse(unsigned int *hashes, int *dataIdx, float *dataVal, int *dataMarker, int numInputEntries) {
unsigned int a1, a2, b1, b2, sparseLen, indice, start, ok;
float value;
#pragma omp parallel private(sparseLen, indice, start, ok, a1, a2, b1, b2, value)
#pragma omp for
for (int i = 0; i < numInputEntries; i++) {
start = dataMarker[i];
sparseLen = dataMarker[i + 1] - start;
for (int tb = 0; tb < _numTables; tb++) {
for (int hashIdx = 0; hashIdx < _rangePow; hashIdx++) {
value = 0;
a1 = _hash_a[tb * _rangePow + hashIdx];
b1 = _hash_b[tb * _rangePow + hashIdx];
a2 = _binhash_a[tb * _rangePow + hashIdx];
b2 = _binhash_b[tb * _rangePow + hashIdx];
for (unsigned int k = 0; k < sparseLen; k++) {
indice = dataIdx[start + k]; // This step is TOO slow, especially when sparseLen is large.
ok = BINARY_HASH(indice, a2, b2);
value += (UNIVERSAL_HASH(indice, _samFactor, a1, b1) == 1) ? (ok ? dataVal[start + indice] : (-dataVal[start + indice])) : 0;
}
hashes[hashesOutputIdx(_rangePow, numInputEntries, i, tb, hashIdx)] = value > 0;
}
}
}
}
void LSH::srp_opencl_dense(cl_mem *hashes_obj, cl_mem *input_obj, int numInputEntries) {
_err = clSetKernelArg(kernel_randproj_dense, 0, sizeof(cl_mem), (void *)hashes_obj);
_err |= clSetKernelArg(kernel_randproj_dense, 1, sizeof(cl_mem), (void *)input_obj);
_err |= clSetKernelArg(kernel_randproj_dense, 4, sizeof(int), (void *)&numInputEntries);
ClCheckError(_err, "Failed to set kernel_randproj arguments!");
size_t gsize_kernel_randproj_dense[3] = { _rangePow, numInputEntries / _groupHashingSize, _numTables };
size_t lsize_kernel_randproj_dense[3] = { _rangePow, 1, 1 };
_err = clEnqueueNDRangeKernel(_command_queue_lsh, kernel_randproj_dense, 3, NULL,
gsize_kernel_randproj_dense, lsize_kernel_randproj_dense, 0, NULL, NULL);
clFinish(_command_queue_lsh);
ClCheckError(_err, "kernel_randproj failed!");
}
void LSH::srp_opencl_sparse(cl_mem *hashes_obj, cl_mem *dataIdx_obj, cl_mem *dataVal_obj, cl_mem *dataMarker_obj, int numInputEntries) {
_err = clSetKernelArg(kernel_randproj_sparse, 0, sizeof(cl_mem), (void *)hashes_obj);
_err |= clSetKernelArg(kernel_randproj_sparse, 1, sizeof(cl_mem), (void *)dataIdx_obj);
_err |= clSetKernelArg(kernel_randproj_sparse, 2, sizeof(cl_mem), (void *)dataVal_obj);
_err |= clSetKernelArg(kernel_randproj_sparse, 3, sizeof(cl_mem), (void *)dataMarker_obj);
_err |= clSetKernelArg(kernel_randproj_sparse, 8, sizeof(int), (void *)&numInputEntries);
ClCheckError(_err, "Failed to set kernel_randproj_sparse arguments!");
size_t gsize_kernel_randproj_sparse[3] = { _rangePow, numInputEntries / _groupHashingSize, _numTables };
size_t lsize_kernel_randproj_sparse[3] = { _rangePow, 1, 1 };
_err = clEnqueueNDRangeKernel(_command_queue_lsh, kernel_randproj_sparse, 3, NULL,
gsize_kernel_randproj_sparse, lsize_kernel_randproj_sparse, 0, NULL, NULL);
clFinish(_command_queue_lsh);
ClCheckError(_err, "kernel_randproj_sparse failed!");
}