NVBIO
Main Page
Modules
Classes
Examples
File List
File Members
•
All
Classes
Namespaces
Files
Functions
Variables
Typedefs
Enumerations
Enumerator
Friends
Macros
Groups
Pages
nvbio
io
vcf.h
Go to the documentation of this file.
1
/*
2
* nvbio
3
* Copyright (c) 2011-2014, NVIDIA CORPORATION. All rights reserved.
4
*
5
* Redistribution and use in source and binary forms, with or without
6
* modification, are permitted provided that the following conditions are met:
7
* * Redistributions of source code must retain the above copyright
8
* notice, this list of conditions and the following disclaimer.
9
* * Redistributions in binary form must reproduce the above copyright
10
* notice, this list of conditions and the following disclaimer in the
11
* documentation and/or other materials provided with the distribution.
12
* * Neither the name of the NVIDIA CORPORATION nor the
13
* names of its contributors may be used to endorse or promote products
14
* derived from this software without specific prior written permission.
15
*
16
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
17
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
18
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
19
* DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY
20
* DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
21
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
22
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
23
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
24
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26
*/
27
28
#include <
nvbio/basic/types.h
>
29
#include <
nvbio/basic/vector.h
>
30
#include <
nvbio/basic/packed_vector.h
>
31
32
#include <vector>
33
#include <string>
34
35
#pragma once
36
37
namespace
nvbio {
38
namespace
io {
39
40
struct
SNP_sequence_index
41
{
42
// these indices are stored in base-pairs since variants are extremely short
43
uint32
reference_start
;
44
uint32
reference_len
;
45
uint32
variant_start
;
46
uint32
variant_len
;
47
48
SNP_sequence_index
()
49
:
reference_start
(0),
reference_len
(0),
50
variant_start
(0),
variant_len
(0)
51
{ }
52
53
SNP_sequence_index
(
uint32
reference_start
,
uint32
reference_len
,
54
uint32
variant_start
,
uint32
variant_len
)
55
: reference_start(reference_start), reference_len(reference_len),
56
variant_start(variant_start), variant_len(variant_len)
57
{ }
58
};
59
60
struct
SNPDatabase
61
{
62
// the name of the reference sequence
63
// note: VCF allows this to be an integer ID encoded in a string that references
64
// a contig from an assembly referenced in the header; this is not supported yet
65
std::vector<std::string>
reference_sequence_names
;
66
67
// start (x) and stop (y) positions of the variant in the reference sequence (first base in the sequence is position 1)
68
// the "stop" position is either start + len or the contents of the END= info tag
69
nvbio::vector<host_tag, uint2>
sequence_positions
;
70
71
// packed reference sequences
72
nvbio::PackedVector<host_tag, 4>
reference_sequences
;
73
// packed variant sequences
74
nvbio::PackedVector<host_tag, 4>
variants
;
75
// an index for both references and variants
76
nvbio::vector<host_tag, SNP_sequence_index>
ref_variant_index
;
77
78
// quality value assigned to each variant
79
nvbio::vector<host_tag, uint8>
variant_qualities
;
80
81
SNPDatabase
()
82
{
83
reference_sequences
.clear();
84
variants
.clear();
85
ref_variant_index
.clear();
86
}
87
};
88
89
// loads variant data from file_name and appends to output
90
/// Loads variant data from a file and appends it to an existing database.
///
/// @param output     database that receives the loaded variant data; the new
///                   data is appended to it
/// @param file_name  name of the file to load
/// @return NOTE(review): the meaning of the bool result is not visible in this
///         header -- presumably true on success; confirm against the
///         implementation
bool
loadVCF
(SNPDatabase& output,
const
char
*file_name);
91
92
}
// namespace io
93
}
// namespace nvbio
Generated on Wed Feb 25 2015 08:32:48 for NVBIO by Doxygen 1.8.4