NVBIO
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Groups Pages
filter.h
Go to the documentation of this file.
1 /*
2  * nvbio
3  * Copyright (c) 2011-2014, NVIDIA CORPORATION. All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions are met:
7  * * Redistributions of source code must retain the above copyright
8  * notice, this list of conditions and the following disclaimer.
9  * * Redistributions in binary form must reproduce the above copyright
10  * notice, this list of conditions and the following disclaimer in the
11  * documentation and/or other materials provided with the distribution.
12  * * Neither the name of the NVIDIA CORPORATION nor the
13  * names of its contributors may be used to endorse or promote products
14  * derived from this software without specific prior written permission.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19  * DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY
20  * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
23  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26  */
27 
28 #pragma once
29 
31 #include <stdio.h>
32 
33 namespace nvbio {
34 namespace alndiff {
35 
36 struct Filter
37 {
38  enum Flags { DISTANT = 1u, DISCORDANT = 2u, DIFFERENT_REF = 4u, ALL = 0xFFFFFFFFu };
39  enum Statistics { ED = 1u, MAPQ = 2u, MMS = 4u, INS = 8u, DELS = 16u, SCORE = 32u };
40 
41  // empty constructor
42  //
43  Filter() : m_file(NULL), m_filtered(0) {}
44 
45  // constructor
46  //
47  // \param file_name output file name
48  // \param flags read flags (DISTANT | DISCORDANT | DIFFERENT_REF | ALL) accepted by the filter
49  // \param stats statistics accepted by the filter
50  // \param delta filtering threshold
51  //
52  Filter(const char* file_name, const uint32 flags, const uint32 stats, const int32 delta) :
53  m_file( NULL ),
54  m_flags( flags ),
55  m_stats( stats ),
56  m_delta( delta ),
57  m_filtered(0)
58  {
59  if (file_name)
60  {
61  log_verbose(stderr, "opening filter file \"%s\"... done\n", file_name);
62  m_file = fopen( file_name, "wb" );
63  if (m_file == NULL)
64  log_warning( stderr, "unable to open filter file \"%s\"\n", file_name );
65  }
66  }
67  // destructor
68  //
70  {
71  if (m_file)
72  {
73  fclose( m_file );
74  log_verbose(stderr, "closing filter file... done\n");
75  }
76  }
77 
78  // push a statistic into the filter
79  //
80  void operator() (const int32 delta, const uint32 flags, const Statistics stat, const uint32 read_id)
81  {
82  if (m_file == NULL)
83  return;
84 
85  if ((m_flags & flags) &&
86  (m_stats & stat) &&
87  (m_delta > 0 ? delta >= m_delta : delta <= m_delta))
88  {
89  fwrite( &read_id, sizeof(uint32), 1u, m_file );
90 
91  ++m_filtered;
92  }
93  }
94 
95  // get filtered count
96  //
97  uint32 filtered() const { return m_filtered; }
98 
99  // flush the file
100  //
101  void flush() { if (m_file) fflush( m_file ); }
102 
103  FILE* m_file;
108 };
109 
110 } // namespace alndiff
111 } // namespace nvbio