-
Notifications
You must be signed in to change notification settings - Fork 24
/
libsais16.h
373 lines (332 loc) · 19.5 KB
/
libsais16.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
/*--
This file is a part of libsais, a library for linear time suffix array,
longest common prefix array and burrows wheeler transform construction.
Copyright (c) 2021-2024 Ilya Grebnov <[email protected]>
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
Please see the file LICENSE for full copyright information.
--*/
#ifndef LIBSAIS16_H
#define LIBSAIS16_H 1
/* Library version as separate integer components (major.minor.patch). */
#define LIBSAIS16_VERSION_MAJOR 2
#define LIBSAIS16_VERSION_MINOR 8
#define LIBSAIS16_VERSION_PATCH 6
/* The same version as a string literal; keep it in sync with the three components above. */
#define LIBSAIS16_VERSION_STRING "2.8.6"
/*
 * LIBSAIS16_API prefixes the public function declarations in this header.
 * It expands to a DLL attribute only when both _WIN32 and LIBSAIS_SHARED are
 * defined: __declspec(dllexport) if LIBSAIS_EXPORTS is also defined,
 * __declspec(dllimport) if it is not. In every other configuration it
 * expands to nothing.
 */
#if defined(_WIN32) && defined(LIBSAIS_SHARED) && defined(LIBSAIS_EXPORTS)
    #define LIBSAIS16_API __declspec(dllexport)
#elif defined(_WIN32) && defined(LIBSAIS_SHARED)
    #define LIBSAIS16_API __declspec(dllimport)
#else
    #define LIBSAIS16_API
#endif
/*
 * <stdint.h> supplies the fixed-width integer types (int32_t, uint16_t) used
 * by the declarations in this header. It is included before the linkage block
 * is opened: C++ requires headers to be included outside of any declaration,
 * and an extern "C" { ... } block is itself a declaration.
 */
#include <stdint.h>
/* Give the declarations that follow C linkage when compiled as C++. */
#ifdef __cplusplus
extern "C" {
#endif
/**
* Creates the libsais16 context that allows reusing allocated memory with each libsais16 operation.
* In multi-threaded environments, use one context per thread for parallel executions.
* @return the libsais16 context, NULL otherwise.
*/
LIBSAIS16_API void * libsais16_create_ctx(void);
#if defined(LIBSAIS_OPENMP)
/**
* Creates the libsais16 context that allows reusing allocated memory with each parallel libsais16 operation using OpenMP.
* In multi-threaded environments, use one context per thread for parallel executions.
* @param threads The number of OpenMP threads to use (can be 0 for OpenMP default).
* @return the libsais16 context, NULL otherwise.
*/
LIBSAIS16_API void * libsais16_create_ctx_omp(int32_t threads);
#endif
/**
* Destroys the libsais16 context and frees previously allocated memory.
* @param ctx The libsais16 context (can be NULL).
*/
LIBSAIS16_API void libsais16_free_ctx(void * ctx);
/**
* Constructs the suffix array of a given 16-bit string.
* @param T [0..n-1] The input 16-bit string.
* @param SA [0..n-1+fs] The output array of suffixes.
* @param n The length of the given 16-bit string.
* @param fs The extra space available at the end of SA array (0 should be enough for most cases).
* @param freq [0..65535] The output 16-bit symbol frequency table (can be NULL).
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16(const uint16_t * T, int32_t * SA, int32_t n, int32_t fs, int32_t * freq);
/**
* Constructs the suffix array of a given integer array.
* Note, during construction input array will be modified, but restored at the end if no errors occurred.
* @param T [0..n-1] The input integer array.
* @param SA [0..n-1+fs] The output array of suffixes.
* @param n The length of the integer array.
* @param k The alphabet size of the input integer array.
* @param fs Extra space available at the end of SA array (can be 0, but 4 * k or, better, 6 * k, where k is the alphabet size, is recommended for optimal performance).
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_int(int32_t * T, int32_t * SA, int32_t n, int32_t k, int32_t fs);
/**
* Constructs the suffix array of a given 16-bit string using libsais16 context.
* @param ctx The libsais16 context.
* @param T [0..n-1] The input 16-bit string.
* @param SA [0..n-1+fs] The output array of suffixes.
* @param n The length of the given 16-bit string.
* @param fs The extra space available at the end of SA array (0 should be enough for most cases).
* @param freq [0..65535] The output 16-bit symbol frequency table (can be NULL).
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_ctx(const void * ctx, const uint16_t * T, int32_t * SA, int32_t n, int32_t fs, int32_t * freq);
#if defined(LIBSAIS_OPENMP)
/**
* Constructs the suffix array of a given 16-bit string in parallel using OpenMP.
* @param T [0..n-1] The input 16-bit string.
* @param SA [0..n-1+fs] The output array of suffixes.
* @param n The length of the given 16-bit string.
* @param fs The extra space available at the end of SA array (0 should be enough for most cases).
* @param freq [0..65535] The output 16-bit symbol frequency table (can be NULL).
* @param threads The number of OpenMP threads to use (can be 0 for OpenMP default).
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_omp(const uint16_t * T, int32_t * SA, int32_t n, int32_t fs, int32_t * freq, int32_t threads);
/**
* Constructs the suffix array of a given integer array in parallel using OpenMP.
* Note, during construction input array will be modified, but restored at the end if no errors occurred.
* @param T [0..n-1] The input integer array.
* @param SA [0..n-1+fs] The output array of suffixes.
* @param n The length of the integer array.
* @param k The alphabet size of the input integer array.
* @param fs Extra space available at the end of SA array (can be 0, but 4 * k or, better, 6 * k, where k is the alphabet size, is recommended for optimal performance).
* @param threads The number of OpenMP threads to use (can be 0 for OpenMP default).
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_int_omp(int32_t * T, int32_t * SA, int32_t n, int32_t k, int32_t fs, int32_t threads);
#endif
/**
* Constructs the burrows-wheeler transformed 16-bit string (BWT) of a given 16-bit string.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n-1+fs] The temporary array.
* @param n The length of the given 16-bit string.
* @param fs The extra space available at the end of A array (0 should be enough for most cases).
* @param freq [0..65535] The output 16-bit symbol frequency table (can be NULL).
* @return The primary index if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_bwt(const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, int32_t fs, int32_t * freq);
/**
* Constructs the burrows-wheeler transformed 16-bit string (BWT) of a given 16-bit string with auxiliary indexes.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n-1+fs] The temporary array.
* @param n The length of the given 16-bit string.
* @param fs The extra space available at the end of A array (0 should be enough for most cases).
* @param freq [0..65535] The output 16-bit symbol frequency table (can be NULL).
* @param r The sampling rate for auxiliary indexes (must be power of 2).
* @param I [0..(n-1)/r] The output auxiliary indexes.
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_bwt_aux(const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, int32_t fs, int32_t * freq, int32_t r, int32_t * I);
/**
* Constructs the burrows-wheeler transformed 16-bit string (BWT) of a given 16-bit string using libsais16 context.
* @param ctx The libsais16 context.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n-1+fs] The temporary array.
* @param n The length of the given 16-bit string.
* @param fs The extra space available at the end of A array (0 should be enough for most cases).
* @param freq [0..65535] The output 16-bit symbol frequency table (can be NULL).
* @return The primary index if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_bwt_ctx(const void * ctx, const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, int32_t fs, int32_t * freq);
/**
* Constructs the burrows-wheeler transformed 16-bit string (BWT) of a given 16-bit string with auxiliary indexes using libsais16 context.
* @param ctx The libsais16 context.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n-1+fs] The temporary array.
* @param n The length of the given 16-bit string.
* @param fs The extra space available at the end of A array (0 should be enough for most cases).
* @param freq [0..65535] The output 16-bit symbol frequency table (can be NULL).
* @param r The sampling rate for auxiliary indexes (must be power of 2).
* @param I [0..(n-1)/r] The output auxiliary indexes.
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_bwt_aux_ctx(const void * ctx, const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, int32_t fs, int32_t * freq, int32_t r, int32_t * I);
#if defined(LIBSAIS_OPENMP)
/**
* Constructs the burrows-wheeler transformed 16-bit string (BWT) of a given 16-bit string in parallel using OpenMP.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n-1+fs] The temporary array.
* @param n The length of the given 16-bit string.
* @param fs The extra space available at the end of A array (0 should be enough for most cases).
* @param freq [0..65535] The output 16-bit symbol frequency table (can be NULL).
* @param threads The number of OpenMP threads to use (can be 0 for OpenMP default).
* @return The primary index if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_bwt_omp(const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, int32_t fs, int32_t * freq, int32_t threads);
/**
* Constructs the burrows-wheeler transformed 16-bit string (BWT) of a given 16-bit string with auxiliary indexes in parallel using OpenMP.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n-1+fs] The temporary array.
* @param n The length of the given 16-bit string.
* @param fs The extra space available at the end of A array (0 should be enough for most cases).
* @param freq [0..65535] The output 16-bit symbol frequency table (can be NULL).
* @param r The sampling rate for auxiliary indexes (must be power of 2).
* @param I [0..(n-1)/r] The output auxiliary indexes.
* @param threads The number of OpenMP threads to use (can be 0 for OpenMP default).
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_bwt_aux_omp(const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, int32_t fs, int32_t * freq, int32_t r, int32_t * I, int32_t threads);
#endif
/**
* Creates the libsais16 reverse BWT context that allows reusing allocated memory with each libsais16_unbwt_* operation.
* In multi-threaded environments, use one context per thread for parallel executions.
* @return the libsais16 reverse BWT context, NULL otherwise.
*/
LIBSAIS16_API void * libsais16_unbwt_create_ctx(void);
#if defined(LIBSAIS_OPENMP)
/**
* Creates the libsais16 reverse BWT context that allows reusing allocated memory with each parallel libsais16_unbwt_* operation using OpenMP.
* In multi-threaded environments, use one context per thread for parallel executions.
* @param threads The number of OpenMP threads to use (can be 0 for OpenMP default).
* @return the libsais16 reverse BWT context, NULL otherwise.
*/
LIBSAIS16_API void * libsais16_unbwt_create_ctx_omp(int32_t threads);
#endif
/**
* Destroys the libsais16 reverse BWT context and frees previously allocated memory.
* @param ctx The libsais16 reverse BWT context (can be NULL).
*/
LIBSAIS16_API void libsais16_unbwt_free_ctx(void * ctx);
/**
* Constructs the original 16-bit string from a given burrows-wheeler transformed 16-bit string (BWT) with primary index.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n] The temporary array (NOTE, temporary array must be n + 1 size).
* @param n The length of the given 16-bit string.
* @param freq [0..65535] The input 16-bit symbol frequency table (can be NULL).
* @param i The primary index.
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_unbwt(const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, const int32_t * freq, int32_t i);
/**
* Constructs the original 16-bit string from a given burrows-wheeler transformed 16-bit string (BWT) with primary index using libsais16 reverse BWT context.
* @param ctx The libsais16 reverse BWT context.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n] The temporary array (NOTE, temporary array must be n + 1 size).
* @param n The length of the given 16-bit string.
* @param freq [0..65535] The input 16-bit symbol frequency table (can be NULL).
* @param i The primary index.
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_unbwt_ctx(const void * ctx, const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, const int32_t * freq, int32_t i);
/**
* Constructs the original 16-bit string from a given burrows-wheeler transformed 16-bit string (BWT) with auxiliary indexes.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n] The temporary array (NOTE, temporary array must be n + 1 size).
* @param n The length of the given 16-bit string.
* @param freq [0..65535] The input 16-bit symbol frequency table (can be NULL).
* @param r The sampling rate for auxiliary indexes (must be power of 2).
* @param I [0..(n-1)/r] The input auxiliary indexes.
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_unbwt_aux(const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, const int32_t * freq, int32_t r, const int32_t * I);
/**
* Constructs the original 16-bit string from a given burrows-wheeler transformed 16-bit string (BWT) with auxiliary indexes using libsais16 reverse BWT context.
* @param ctx The libsais16 reverse BWT context.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n] The temporary array (NOTE, temporary array must be n + 1 size).
* @param n The length of the given 16-bit string.
* @param freq [0..65535] The input 16-bit symbol frequency table (can be NULL).
* @param r The sampling rate for auxiliary indexes (must be power of 2).
* @param I [0..(n-1)/r] The input auxiliary indexes.
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_unbwt_aux_ctx(const void * ctx, const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, const int32_t * freq, int32_t r, const int32_t * I);
#if defined(LIBSAIS_OPENMP)
/**
* Constructs the original 16-bit string from a given burrows-wheeler transformed 16-bit string (BWT) with primary index in parallel using OpenMP.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n] The temporary array (NOTE, temporary array must be n + 1 size).
* @param n The length of the given 16-bit string.
* @param freq [0..65535] The input 16-bit symbol frequency table (can be NULL).
* @param i The primary index.
* @param threads The number of OpenMP threads to use (can be 0 for OpenMP default).
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_unbwt_omp(const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, const int32_t * freq, int32_t i, int32_t threads);
/**
* Constructs the original 16-bit string from a given burrows-wheeler transformed 16-bit string (BWT) with auxiliary indexes in parallel using OpenMP.
* @param T [0..n-1] The input 16-bit string.
* @param U [0..n-1] The output 16-bit string (can be T).
* @param A [0..n] The temporary array (NOTE, temporary array must be n + 1 size).
* @param n The length of the given 16-bit string.
* @param freq [0..65535] The input 16-bit symbol frequency table (can be NULL).
* @param r The sampling rate for auxiliary indexes (must be power of 2).
* @param I [0..(n-1)/r] The input auxiliary indexes.
* @param threads The number of OpenMP threads to use (can be 0 for OpenMP default).
* @return 0 if no error occurred, -1 or -2 otherwise.
*/
LIBSAIS16_API int32_t libsais16_unbwt_aux_omp(const uint16_t * T, uint16_t * U, int32_t * A, int32_t n, const int32_t * freq, int32_t r, const int32_t * I, int32_t threads);
#endif
/**
* Constructs the permuted longest common prefix array (PLCP) of a given 16-bit string and a suffix array.
* @param T [0..n-1] The input 16-bit string.
* @param SA [0..n-1] The input suffix array.
* @param PLCP [0..n-1] The output permuted longest common prefix array.
* @param n The length of the 16-bit string and the suffix array.
* @return 0 if no error occurred, -1 otherwise.
*/
LIBSAIS16_API int32_t libsais16_plcp(const uint16_t * T, const int32_t * SA, int32_t * PLCP, int32_t n);
/**
* Constructs the longest common prefix array (LCP) of a given permuted longest common prefix array (PLCP) and a suffix array.
* @param PLCP [0..n-1] The input permuted longest common prefix array.
* @param SA [0..n-1] The input suffix array.
* @param LCP [0..n-1] The output longest common prefix array (can be SA).
* @param n The length of the permuted longest common prefix array and the suffix array.
* @return 0 if no error occurred, -1 otherwise.
*/
LIBSAIS16_API int32_t libsais16_lcp(const int32_t * PLCP, const int32_t * SA, int32_t * LCP, int32_t n);
#if defined(LIBSAIS_OPENMP)
/**
* Constructs the permuted longest common prefix array (PLCP) of a given 16-bit string and a suffix array in parallel using OpenMP.
* @param T [0..n-1] The input 16-bit string.
* @param SA [0..n-1] The input suffix array.
* @param PLCP [0..n-1] The output permuted longest common prefix array.
* @param n The length of the 16-bit string and the suffix array.
* @param threads The number of OpenMP threads to use (can be 0 for OpenMP default).
* @return 0 if no error occurred, -1 otherwise.
*/
LIBSAIS16_API int32_t libsais16_plcp_omp(const uint16_t * T, const int32_t * SA, int32_t * PLCP, int32_t n, int32_t threads);
/**
* Constructs the longest common prefix array (LCP) of a given permuted longest common prefix array (PLCP) and a suffix array in parallel using OpenMP.
* @param PLCP [0..n-1] The input permuted longest common prefix array.
* @param SA [0..n-1] The input suffix array.
* @param LCP [0..n-1] The output longest common prefix array (can be SA).
* @param n The length of the permuted longest common prefix array and the suffix array.
* @param threads The number of OpenMP threads to use (can be 0 for OpenMP default).
* @return 0 if no error occurred, -1 otherwise.
*/
LIBSAIS16_API int32_t libsais16_lcp_omp(const int32_t * PLCP, const int32_t * SA, int32_t * LCP, int32_t n, int32_t threads);
#endif
#ifdef __cplusplus
}
#endif
#endif