NVBIO
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Groups Pages
bwt.h
Go to the documentation of this file.
1 /*
2  * nvbio
3  * Copyright (c) 2011-2014, NVIDIA CORPORATION. All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions are met:
7  * * Redistributions of source code must retain the above copyright
8  * notice, this list of conditions and the following disclaimer.
9  * * Redistributions in binary form must reproduce the above copyright
10  * notice, this list of conditions and the following disclaimer in the
11  * documentation and/or other materials provided with the distribution.
12  * * Neither the name of the NVIDIA CORPORATION nor the
13  * names of its contributors may be used to endorse or promote products
14  * derived from this software without specific prior written permission.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19  * DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY
20  * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
23  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26  */
27 
28 #pragma once
29 
30 #include <nvbio/basic/types.h>
31 #include <sais.h>
32 
33 namespace nvbio {
34 
38 template <typename StreamIterator>
39 uint32 gen_sa(const uint32 n, const StreamIterator T, int32 *SA)
40 {
41  SA[0] = n;
42  if (n <= 1) {
43  if (n == 1) SA[1] = 0;
44  return 0;
45  }
46  return saisxx( T, SA+1, int32(n), 4 );
47 }
48 
51 template <typename StreamIterator>
52 uint32 gen_bwt_from_sa(const uint32 n, const StreamIterator T, const int32* SA, StreamIterator bwt)
53 {
54  uint32 i, primary = 0;
55 
56  for (i = 0; i <= n; ++i)
57  {
58  if (SA[i] == 0) primary = i;
59  else bwt[i] = T[SA[i] - 1];
60  }
61  for (i = primary; i < n; ++i) bwt[i] = bwt[i + 1];
62  return primary;
63 }
64 
67 template <typename StreamIterator>
68 int32 gen_bwt(const uint32 n, const StreamIterator T, int32* buffer, StreamIterator bwt)
69 {
70  return saisxx_bwt( T, bwt, buffer, int32(n), 4 );
71 }
72 
75 template <typename StreamIterator>
76 int64 gen_bwt(const uint32 n, const StreamIterator T, int64* buffer, StreamIterator bwt)
77 {
78  return saisxx_bwt( T, bwt, buffer, int64(n), int64(4) );
79 }
80 
81 // generate table for counting 11,10,01,00(pattern) for 8 bits number
82 // table [no# ] = representation ( # of count-pattern, . , . , . )
83 // ---------------------------------------------------------------------------
84 // e.g cnt_table[11111111] = 0x04000000 ( 4-11, 0-10, 0-01, 0-00 )
85 // cnt_table[00100001] = 0x00010102 ( 0-11, 1-10, 1-01, 2-00 )
86 // cnt_table[00000001] = 0x00000103 ( 0-11, 0-10, 1-01, 3-00 )
87 inline void gen_bwt_count_table(uint32* count_table)
88 {
89  for (int i = 0; i != 256; ++i)
90  {
91  uint32 x = 0;
92  for (int j = 0; j != 4; ++j)
93  x |= (((i&3) == j) + ((i>>2&3) == j) + ((i>>4&3) == j) + (i>>6 == j)) << (j<<3);
94 
95  count_table[i] = x;
96  }
97 }
98 
99 } // namespace nvbio
100