-
Notifications
You must be signed in to change notification settings - Fork 10
/
Copy pathquerycontext.h
127 lines (108 loc) · 3 KB
/
querycontext.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
// slash - a locality sensitive hashing library.
// Copyright (c) 2013 Utkan Güngördü <[email protected]>
//
// This program is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program. If not, see <http://www.gnu.org/licenses/>.
#ifndef SLASH_QUERYCONTEXT_H
#define SLASH_QUERYCONTEXT_H
#include <vector>
#include <stdlib.h>
#include "float.h"
namespace slash {

// Max-similarity search context.
//
// Accumulates candidate feature vectors together with their similarity score
// and multiplicity (number of copies). Candidates are appended until the total
// number of copies (`found`) reaches `limit`; after that a new candidate is
// accepted only if its similarity is strictly greater than the lowest stored
// similarity, in which case it overwrites that lowest entry (all of its copies).
template <class FeatureVector>
class QueryContext {
    // Lowest stored similarity and the slot holding it. Kept up to date
    // whenever found >= limit, which is the only time Insert consults them.
    float curmin;
    size_t curminIndex;

    // Parallel arrays: slot i holds a vector, its similarity and its copy count.
    std::vector<FeatureVector> neighbors;
    std::vector<float> similarities;
    std::vector<int> ncopies;

    int limit;    // target number of copies to collect
    int found;    // sum of ncopies over all slots
    int uniques;  // number of occupied slots

    // Recomputes curmin / curminIndex with a linear scan over the stored
    // similarities. Ties resolve to the first slot. If no similarity is below
    // FLT_MAX (or nothing is stored), curmin is FLT_MAX and curminIndex is 0,
    // so the index never holds an out-of-range sentinel.
    inline void updateMin() {
        float lowest = FLT_MAX;
        size_t lowestAt = 0;
        for (size_t i = 0; i < this->similarities.size(); i++) {
            const float s = this->similarities[i];
            if (s < lowest) {
                lowest = s;
                lowestAt = i;
            }
        }
        this->curmin = lowest;
        this->curminIndex = lowestAt;
    }

public:
    // Offers candidate `q` with similarity `s`, present `n` times.
    //
    // Ignored when n <= 0, when the context was created with limit <= 0, or
    // when the context is full (found >= limit) and `s` does not beat the
    // current minimum. While below the limit the candidate is appended;
    // otherwise it replaces the lowest-similarity slot and `found` is adjusted
    // by the difference in copy counts.
    inline void Insert(const FeatureVector &q, float s, int n) {
        if (n <= 0 || this->limit <= 0) {
            return;
        }

        if (this->found < this->limit) {
            this->neighbors.push_back(q);
            this->similarities.push_back(s);
            this->ncopies.push_back(n);
            this->found += n;
            this->uniques++;
            // Copies count towards the limit, so the context can become full
            // before `uniques` reaches `limit`. The minimum must be valid from
            // that moment on, otherwise later (better) candidates would be
            // compared against a stale or never-computed curmin.
            if (this->found >= this->limit) {
                this->updateMin();
            }
            return;
        }

        if (s <= this->curmin) {
            return;
        }

        const size_t slot = this->curminIndex;
        this->found += n - this->ncopies[slot];
        this->neighbors[slot] = q;
        this->similarities[slot] = s;
        this->ncopies[slot] = n;
        this->updateMin();
    }

    // Returns a copy of the stored feature vectors (one per slot, regardless
    // of copy count), in slot order.
    inline std::vector<FeatureVector> Neighbors() const {
        return this->neighbors;
    }

    // Returns the limit passed to the constructor.
    inline int Limit() const {
        return this->limit;
    }

    // Used internally by LSH::Query. Don't use.
    // Removes one copy of the most similar item. If that item has further
    // copies its slot is kept; otherwise the slot is dropped by moving the
    // last slot into its place (slot order is not preserved).
    // No-op on an empty context.
    inline void shrink() {
        if (this->similarities.empty()) {
            return;
        }

        float highest = -FLT_MAX;
        size_t top = 0;
        for (size_t i = 0; i < this->similarities.size(); i++) {
            const float s = this->similarities[i];
            if (s > highest) {
                highest = s;
                top = i;
            }
        }

        this->found--;
        if (this->ncopies[top] > 1) {
            this->ncopies[top]--;
            return;
        }

        // Swap-with-last removal, applied to all three parallel arrays so the
        // bookkeeping stays consistent with what Neighbors() reports.
        const size_t last = this->similarities.size() - 1;
        if (top != last) {
            this->neighbors[top] = this->neighbors[last];
            this->similarities[top] = this->similarities[last];
            this->ncopies[top] = this->ncopies[last];
        }
        this->neighbors.pop_back();
        this->similarities.pop_back();
        this->ncopies.pop_back();
        this->uniques--;

        // Slots moved, so the cached minimum index may no longer be valid.
        this->updateMin();
    }

    // Creates a context that collects up to `limit` copies. A non-positive
    // limit yields a context that never stores anything.
    explicit QueryContext(int limit)
        : curmin(FLT_MAX),
          curminIndex(0),
          limit(limit),
          found(0),
          uniques(0) {
        if (limit > 0) {
            const size_t capacity = static_cast<size_t>(limit);
            this->neighbors.reserve(capacity);
            this->similarities.reserve(capacity);
            this->ncopies.reserve(capacity);
        }
    }
};

}  // namespace slash
#endif // SLASH_QUERYCONTEXT_H