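/*
 * hls-performance-thesis/code/fpga/ndrange.cl
 *
 * Repository listing metadata: 48 lines, 1.5 KiB,
 * listing timestamp 2021-07-03 15:59:32 +00:00.
 * The listing labels this file "Common Lisp" because of its .cl extension;
 * the content is OpenCL C.
 */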
/* Work-group size in dimension 0; the fmindex kernel requires exactly this size through its reqd_work_group_size attribute. */
#define LOCAL_SIZE 300
/*
 * Return the index of the first element of `s` that equals `c`.
 *
 * The scan has no upper bound: it advances until a match is found, so the
 * caller must guarantee that `c` occurs somewhere in `s`. If it does not,
 * the loop keeps reading past the end of the buffer.
 */
inline static int string_index(__global char *s, char c) {
  int pos = 0;
  while (s[pos] != c) {
    ++pos;
  }
  return pos;
}
/*
 * Pattern lookup kernel: each work-item processes one pattern, walking it
 * from its last character to its first while narrowing a [start, end) range,
 * then writes the number of hits and the corresponding `sa` entries to `out`.
 *
 * Buffer layout, as used by the indexing below:
 *   alphabet - symbols; a character's position here is its symbol index.
 *   ranges   - two entries per symbol: [2*idx] = range start,
 *              [2*idx + 1] = range end.
 *   ranks    - rows of `alphabet_sz` entries; row r, column idx is read as
 *              ranks[alphabet_sz * r + idx].
 *   sa       - values copied to the output for every position in
 *              [start, end).
 *   patterns - `pattern_count` patterns of `pattern_sz` characters each,
 *              stored back to back.
 *   out      - one slot of `out_sz` entries per pattern: the first entry is
 *              the match count, followed by up to `out_sz - 1` `sa` values.
 *
 * `bwt` and `bwt_sz` are part of the kernel signature but are not read here.
 *
 * Preconditions (not checked): `pattern_sz` >= 1, and every pattern
 * character occurs in `alphabet` (string_index does not terminate cleanly
 * otherwise).
 *
 * Differences from a naive per-work-item body:
 *   - Work-items with a global id >= `pattern_count` do nothing. The required
 *     work-group size forces the global size to a multiple of LOCAL_SIZE, so
 *     padding work-items may exist.
 *   - At most `out_sz - 1` positions are written per pattern so a pattern
 *     with many hits cannot spill into the next pattern's slot or past the
 *     end of `out`. The reported count is still the full match count, so the
 *     host can detect truncation when count > out_sz - 1.
 *   - Per-pattern base offsets are computed in size_t to avoid 32-bit
 *     wrap-around for large batches.
 */
kernel
__attribute__((reqd_work_group_size(LOCAL_SIZE, 1, 1)))
__attribute__((xcl_zero_global_work_offset))
void fmindex(__global char *bwt,
             __global char *alphabet,
             __global unsigned *ranks,
             __global unsigned *sa,
             __global unsigned *ranges,
             __global char *patterns,
             __global unsigned long *out,
             size_t bwt_sz, size_t alphabet_sz, unsigned pattern_count,
             unsigned pattern_sz, unsigned out_sz) {
  __attribute__((xcl_pipeline_workitems)) {
    const unsigned i = (unsigned)get_global_id(0);

    /* Skip padding work-items that have no pattern assigned. */
    if (i < pattern_count) {
      const size_t pattern_base = (size_t)i * pattern_sz;
      const size_t out_base = (size_t)i * out_sz;

      /* Seed the range from the last character of the pattern. */
      int p_idx = pattern_sz - 1;
      char c = patterns[pattern_base + p_idx];
      int alphabet_idx = string_index(alphabet, c);
      unsigned start = ranges[2 * alphabet_idx];
      unsigned end = ranges[2 * alphabet_idx + 1];
      p_idx -= 1;

      /*
       * Extend the match one character to the left per iteration.
       * NOTE(review): `end > 1` presumably protects the `end - 1` row index;
       * `start - 1` is not protected and wraps if start is 0 - confirm that
       * the index construction guarantees start >= 1.
       */
      while (p_idx >= 0 && end > 1) {
        c = patterns[pattern_base + p_idx];
        alphabet_idx = string_index(alphabet, c);
        unsigned range_start = ranges[2 * alphabet_idx];
        start = range_start + ranks[alphabet_sz * (start - 1) + alphabet_idx];
        end = range_start + ranks[alphabet_sz * (end - 1) + alphabet_idx];
        p_idx -= 1;
      }

      /* First entry of the slot: total number of matches. */
      unsigned long match_count = end - start;
      out[out_base] = match_count;

      /* Remaining entries: matched positions, limited to the slot capacity. */
      const unsigned long capacity = (out_sz > 0) ? (unsigned long)(out_sz - 1) : 0;
      const unsigned long to_write = (match_count < capacity) ? match_count : capacity;
      for (unsigned j = 0; j < to_write; ++j) {
        out[out_base + j + 1] = sa[start + j];
      }
    }
  }
}