-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathfmd.i
132 lines (105 loc) · 3.46 KB
/
fmd.i
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
// Name the module something Java-y that isn't going to clash with the FMD
// class.
%module FMDUtil
// Set up STL compatibility
%include "std_string.i"
%include "std_vector.i"
%include "std_pair.i"
// Set up exception not-killing-the-process-ness. See
// <http://www.swig.org/Doc1.3/Library.html#Library_nn17>
%include "exception.i"
%exception {
try {
$action
} catch (const std::exception& e) {
SWIG_exception(SWIG_RuntimeError, e.what());
}
}
%{
#include "fmd.h"
using namespace CSA;
%}
#ifdef MASSIVE_DATA_RLCSA
typedef unsigned long usint;
// HACK: This is really a "signed long", but SWIG turns that into a Java int,
// which is clearly smaller. So we lie to it to get it to use a Java long.
// TODO: Use typemaps or something to fix this instead.
typedef unsigned long sint;
#else
typedef unsigned int usint;
typedef signed int sint;
#endif
// Decide uchars are chars here (unlike in rlcsa.i), so every uchar* is a
// string.
typedef char uchar;
// Make sure to rename these things that we swap out with #defines to a
// consistent name. Also note that these "vectors" are bit vectors, not
// std::vectors.
#ifdef USE_NIBBLE_VECTORS
// Use Nibble Vectors to encode our range endpoint bitmaps
%rename(RangeVector) NibbleVector;
typedef NibbleVector RangeVector;
%rename(RangeEncoder) NibbleEncoder;
typedef NibbleEncoder RangeEncoder;
%{
typedef NibbleVector::Iterator RangeVectorIterator;
%}
#else
// Use RLEVectors to encode our range endpoint bitmaps
%rename(RangeVector) RLEVector;
typedef RLEVector RangeVector;
%rename(RangeEncoder) RLEEncoder;
typedef RLEEncoder RangeEncoder;
%{
typedef RLEVector::Iterator RangeVectorIterator;
%}
#endif
// We need to use the inner vector iterator classes to look at vectors. Give a
// partial definition under a new name that works with the conditional typedefs
// above.
class RangeVectorIterator
{
public:
explicit RangeVectorIterator(const CSA::RangeVector& par);
~RangeVectorIterator();
usint rank(usint value, bool at_least = false);
usint select(usint index);
usint selectNext();
pair_type valueBefore(usint value);
pair_type valueAfter(usint value);
pair_type nextValue();
pair_type selectRun(usint index, usint max_length);
pair_type selectNextRun(usint max_length);
bool isSet(usint value);
usint countRuns();
};
// Since we will need to load and save range vectors to files, we need to expose
// a minimal C FILE API.
FILE* fopen(char* filename, char* mode);
void fclose(FILE* file);
// Java needs to work with vectors of mappings coming back from the map method.
%template(MappingVector) std::vector<CSA::Mapping>;
// Java also needs to work with vectors of sints coming back from the map method
// when working on ranges.
%template(SintVector) std::vector<sint>;
// Java needs to work with pair_types that are locate in text results.
typedef std::pair<usint, usint> pair_type;
%template(pair_type) std::pair<usint, usint>;
// Java can't handle this operator name.
%rename(leftShift) operator<<(std::ostream& o, FMDPosition const& position);
// Whenever any of the JNI classes loads, load the native library.
%pragma(java) jniclasscode=%{
static {
RLCSANativeLoader.load();
}
%}
// We already worked around the inner classes thing.
#pragma SWIG nowarn=SWIGWARN_PARSE_NESTED_CLASS
%include "bits/bitvector.h"
#ifdef USE_NIBBLE_VECTORS
%include "bits/nibblevector.h"
#else
%include "bits/rlevector.h"
#endif
%import "rlcsa.h"
%include "fmd.h"