vdj_pipe
pipeline for processing DNA sequence data
|
Generalized DNA suffix tree. More...
#include <gdst.hpp>
Classes | |
struct | Err |
Public Types | |
typedef detail::Id_map< Seq_id, Seq_entry > | seq_map |
typedef boost::shared_ptr< seq_map > | seq_map_ptr |
typedef Seq_pos< Seq_id > | match_type |
typedef std::vector< match_type > | match_vector |
Public Member Functions | |
Gdst () | |
Gdst (seq_map_ptr ss) | |
std::size_t | size () const |
Depth_iter | depth_first () const |
Branch_id | root () const |
seq_map const & | sequence_map () const |
seq_map & | sequence_map () |
Branch const & | operator[] (const Branch_id bid) const |
Leaf const & | operator[] (const Leaf_id lid) const |
Seq_entry const & | operator[] (const Seq_id sid) const |
Leaf const & | leaf (const Branch_id bid) const |
const seq_type | suffix (const Seq_id sid, const unsigned len) const |
const seq_type | suffix (const Leaf_id lid, const unsigned len) const |
const seq_type | suffix (Branch const &b) const |
const seq_type | suffix (const Branch_id bid) const |
Nucleotide | letter (const Branch_id bid, const unsigned i) const |
Nucleotide | letter (const Branch_id bid, const Nucleotide n, const unsigned i) const |
Branch_id | child (const Branch_id bid1, const Nucleotide n) const |
Branch_id | child (const Branch_id bid1, const seq_type seq) const |
void | child (const Branch_id bid1, const Nucleotide n, const Branch_id bid2) |
Common_subseq | find_longest (const seq_type seq, std::size_t min_len=0) const |
void | find_overlaping (const boost::string_ref seq, detail::Vector_set< Seq_id > &vs, std::size_t min_overlap=0) const |
Match | find (const seq_type seq, const Branch_id bid, unsigned min_d=0) const |
void | insert (const Seq_id sid) |
Private Types | |
typedef detail::Id_map< Branch_id, Branch > | branch_map |
typedef detail::Id_map< Leaf_id, Leaf > | leaf_map |
typedef detail::Id_map< Children_id, Children > | children_map |
typedef boost::string_ref | seq_type |
Private Member Functions | |
void | collect_sequences (const gdst::Branch_id nid, detail::Vector_set< Seq_id > &vs) const |
void | suffix_link (const Branch_id bid1, const Branch_id bid2) |
Branch_id | suffix_link (const Branch_id bid) const |
unsigned | edge_length (const Branch_id bid, const Nucleotide n) const |
unsigned | edge_length (const Branch_id bid, const seq_type suff) const |
void | check_edge (Branch_id &an, unsigned &aei, unsigned &al, const boost::string_ref seq) const |
void | add_to_leaf (const Branch_id bid, const Seq_id sid) |
Branch_id | leaf_from_branch (const Branch_id bid1, const Nucleotide n1, const unsigned i, const Seq_id sid) |
Branch_id | split_edge (const Branch_id bid1, const Nucleotide n1, const unsigned i, const Nucleotide n2) |
Private Attributes | |
seq_map_ptr | ss_ |
branch_map | bm_ |
children_map | cm_ |
leaf_map | lm_ |
Branch_id | root_ |
Friends | |
class | Gdst_stats |
class | Common_substrings |
class | Ukkonen_inserter |
Generalized DNA suffix tree.
|
private |
|
private |
|
private |
typedef Seq_pos<Seq_id> vdj_pipe::gdst::Gdst::match_type |
typedef std::vector<match_type> vdj_pipe::gdst::Gdst::match_vector |
typedef detail::Id_map<Seq_id, Seq_entry> vdj_pipe::gdst::Gdst::seq_map |
typedef boost::shared_ptr<seq_map> vdj_pipe::gdst::Gdst::seq_map_ptr |
|
private |
|
inline |
|
inline explicit |
|
inline private |
|
inline private |
|
inline |
|
inline |
|
inline |
|
inline private |
|
inline |
|
inline private |
|
inline private |
|
inline |
Common_subseq vdj_pipe::gdst::Gdst::find_longest(const seq_type seq, std::size_t min_len = 0) const
Find the longest common substring.
Parameters:
seq | DNA sequence containing no ambiguous characters |
min_len | minimum common substring length; if min_len == 0, only complete matches are considered |
void vdj_pipe::gdst::Gdst::find_overlaping(const boost::string_ref seq, detail::Vector_set< Seq_id > & vs, std::size_t min_overlap = 0) const
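Parameters:
seq | sequence of non-ambiguous nucleotides |
vs | set of sequence IDs; presumably receives the matching sequences, since the function returns void (not documented in the original; confirm against the implementation) |
min_overlap | minimum overlap size; if min_overlap == 0, only fully matching sequences are returned |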
void vdj_pipe::gdst::Gdst::insert(const Seq_id sid)
|
inline |
|
inline private |
|
inline |
|
inline |
|
inline |
|
inline |
|
inline |
|
inline |
|
inline |
|
inline |
|
inline |
|
inline private |
|
inline |
|
inline |
|
inline |
|
inline private |
|
inline private |
|
friend |
|
friend |
|
friend |
|
private |
|
private |
|
private |
|
private |
|
private |