vg
tools for working with variation graphs
Public Member Functions | Protected Member Functions | Protected Attributes | List of all members
vg::VCFGenotyper Class Reference

#include <graph_caller.hpp>

Inheritance diagram for vg::VCFGenotyper:
vg::GraphCaller vg::VCFOutputCaller vg::GAFOutputCaller

Public Member Functions

 VCFGenotyper (const PathHandleGraph &graph, SnarlCaller &snarl_caller, SnarlManager &snarl_manager, vcflib::VariantCallFile &variant_file, const string &sample_name, const vector< string > &ref_paths, const vector< int > &ref_path_ploidies, FastaReference *ref_fasta, FastaReference *ins_fasta, AlignmentEmitter *aln_emitter, bool traversals_only, bool gaf_output, size_t trav_padding)
 
virtual ~VCFGenotyper ()
 
virtual bool call_snarl (const Snarl &snarl)
 Call a given snarl, and print the output to out_stream. More...
 
virtual string vcf_header (const PathHandleGraph &graph, const vector< string > &contigs, const vector< size_t > &contig_length_overrides={}) const
 Write the vcf header (version and contigs and basic info) More...
 
- Public Member Functions inherited from vg::GraphCaller
 GraphCaller (SnarlCaller &snarl_caller, SnarlManager &snarl_manager)
 
virtual ~GraphCaller ()
 
virtual void call_top_level_snarls (const HandleGraph &graph, RecurseType recurse_type=RecurseOnFail)
 
virtual void call_top_level_chains (const HandleGraph &graph, size_t max_edges, size_t max_trivial, RecurseType recurise_type=RecurseOnFail)
 
void set_show_progress (bool show_progress)
 toggle progress messages More...
 
- Public Member Functions inherited from vg::VCFOutputCaller
 VCFOutputCaller (const string &sample_name)
 
virtual ~VCFOutputCaller ()
 
bool add_variant (vcflib::Variant &var) const
 
void write_variants (ostream &out_stream, const SnarlManager *snarl_manager=nullptr)
 
void vcf_fixup (vcflib::Variant &var) const
 Run vcffixup from vcflib. More...
 
void set_translation (const unordered_map< nid_t, pair< string, size_t >> *translation)
 Add a translation map. More...
 
void set_nested (bool nested)
 Assume writing nested snarls is enabled. More...
 
- Public Member Functions inherited from vg::GAFOutputCaller
 GAFOutputCaller (AlignmentEmitter *emitter, const string &sample_name, const vector< string > &ref_paths, size_t trav_padding)
 The emitter object is created and owned by external forces. More...
 
virtual ~GAFOutputCaller ()
 
void emit_gaf_traversals (const PathHandleGraph &graph, const string &snarl_name, const vector< SnarlTraversal > &travs, int64_t ref_trav_idx, const string &ref_path_name, int64_t ref_path_position, const TraversalSupportFinder *support_finder=nullptr)
 print the GAF traversals More...
 
void emit_gaf_variant (const PathHandleGraph &graph, const string &snarl_name, const vector< SnarlTraversal > &travs, const vector< int > &genotype, int64_t ref_trav_idx, const string &ref_path_name, int64_t ref_path_position, const TraversalSupportFinder *support_finder=nullptr)
 print the GAF genotype More...
 
SnarlTraversal pad_traversal (const PathHandleGraph &graph, const SnarlTraversal &trav) const
 pad a traversal with (first found) reference path, adding up to trav_padding to each side More...
 

Protected Member Functions

tuple< string, size_t, size_t > get_ref_positions (const vector< vcflib::Variant * > &variants) const
 get path positions bounding a set of variants More...
 
virtual unordered_map< string, size_t > scan_contig_lengths () const
 munge out the contig lengths from the VCF header More...
 
- Protected Member Functions inherited from vg::GraphCaller
vector< Chainbreak_chain (const HandleGraph &graph, const Chain &chain, size_t max_edges, size_t max_trivial)
 Break up a chain into bits that we want to call using size heuristics. More...
 
- Protected Member Functions inherited from vg::VCFOutputCaller
void add_allele_path_to_info (const HandleGraph *graph, vcflib::Variant &v, int allele, const Traversal &trav, bool reversed, bool one_based) const
 add a traversal to the VCF info field in the format of a GFA W-line or GAF path More...
 
void add_allele_path_to_info (vcflib::Variant &v, int allele, const SnarlTraversal &trav, bool reversed, bool one_based) const
 legacy version of above More...
 
string trav_string (const HandleGraph &graph, const SnarlTraversal &trav) const
 convert a traversal into an allele string More...
 
bool emit_variant (const PathPositionHandleGraph &graph, SnarlCaller &snarl_caller, const Snarl &snarl, const vector< SnarlTraversal > &called_traversals, const vector< int > &genotype, int ref_trav_idx, const unique_ptr< SnarlCaller::CallInfo > &call_info, const string &ref_path_name, int ref_offset, bool genotype_snarls, int ploidy, function< string(const vector< SnarlTraversal > &, const vector< int > &, int, int, int)> trav_to_string=nullptr)
 
tuple< int64_t, int64_t, bool, step_handle_t, step_handle_tget_ref_interval (const PathPositionHandleGraph &graph, const Snarl &snarl, const string &ref_path_name) const
 
pair< string, int64_t > get_ref_position (const PathPositionHandleGraph &graph, const Snarl &snarl, const string &ref_path_name, int64_t ref_path_offset) const
 used for making gaf traversal names More...
 
void flatten_common_allele_ends (vcflib::Variant &variant, bool backward, size_t len_override) const
 
string print_snarl (const HandleGraph *grpah, const handle_t &snarl_start, const handle_t &snarl_end, bool in_brackets=false) const
 
string print_snarl (const Snarl &snarl, bool in_brackets=false) const
 legacy version of above More...
 
void scan_snarl (const string &allele_string, function< void(const string &, Snarl &)> callback) const
 
void update_nesting_info_tags (const SnarlManager *snarl_manager)
 

Protected Attributes

const PathHandleGraphgraph
 the graph More...
 
vcflib::VariantCallFile & input_vcf
 input VCF to genotype, must have been loaded etc elsewhere More...
 
VCFTraversalFinder traversal_finder
 
bool traversals_only
 toggle whether to genotype or just output the traversals More...
 
bool gaf_output
 toggle whether to output vcf or gaf More...
 
unordered_map< string, int > path_to_ploidy
 the ploidies More...
 
- Protected Attributes inherited from vg::GraphCaller
SnarlCallersnarl_caller
 Our Genotyper. More...
 
SnarlManagersnarl_manager
 Our snarls. More...
 
bool show_progress
 Toggle progress messages. More...
 
- Protected Attributes inherited from vg::VCFOutputCaller
vcflib::VariantCallFile output_vcf
 output vcf More...
 
string sample_name
 Sample name. More...
 
vector< vector< pair< pair< string, size_t >, string > > > output_variants
 
size_t max_uncalled_alleles = 5
 print up to this many uncalled alleles when doing ref-genotpes in -a mode More...
 
const unordered_map< nid_t, pair< string, size_t > > * translation
 
bool include_nested
 
- Protected Attributes inherited from vg::GAFOutputCaller
AlignmentEmitteremitter
 
string gaf_sample_name
 Sample name. More...
 
size_t trav_padding = 0
 
unordered_set< string > ref_paths
 Reference paths are used to pad out traversals. If there are none, then first path found is used. More...
 

Additional Inherited Members

- Public Types inherited from vg::GraphCaller
enum  RecurseType { RecurseOnFail, RecurseAlways, RecurseNever }
 
- Static Protected Attributes inherited from vg::VCFOutputCaller
static const int64_t max_vcf_line_length = 2000000000
 

Detailed Description

VCFGenotyper : Genotype variants in a given VCF file

Constructor & Destructor Documentation

◆ VCFGenotyper()

vg::VCFGenotyper::VCFGenotyper ( const PathHandleGraph graph,
SnarlCaller snarl_caller,
SnarlManager snarl_manager,
vcflib::VariantCallFile &  variant_file,
const string &  sample_name,
const vector< string > &  ref_paths,
const vector< int > &  ref_path_ploidies,
FastaReference *  ref_fasta,
FastaReference *  ins_fasta,
AlignmentEmitter aln_emitter,
bool  traversals_only,
bool  gaf_output,
size_t  trav_padding 
)

◆ ~VCFGenotyper()

vg::VCFGenotyper::~VCFGenotyper ( )
virtual

Member Function Documentation

◆ call_snarl()

bool vg::VCFGenotyper::call_snarl ( const Snarl snarl)
virtual

Call a given snarl, and print the output to out_stream.

Implements vg::GraphCaller.

◆ get_ref_positions()

tuple< string, size_t, size_t > vg::VCFGenotyper::get_ref_positions ( const vector< vcflib::Variant * > &  variants) const
protected

get path positions bounding a set of variants

◆ scan_contig_lengths()

unordered_map< string, size_t > vg::VCFGenotyper::scan_contig_lengths ( ) const
protectedvirtual

munge out the contig lengths from the VCF header

◆ vcf_header()

string vg::VCFGenotyper::vcf_header ( const PathHandleGraph graph,
const vector< string > &  contigs,
const vector< size_t > &  contig_length_overrides = {} 
) const
virtual

Write the vcf header (version and contigs and basic info)

Reimplemented from vg::VCFOutputCaller.

Member Data Documentation

◆ gaf_output

bool vg::VCFGenotyper::gaf_output
protected

toggle whether to output vcf or gaf

◆ graph

const PathHandleGraph& vg::VCFGenotyper::graph
protected

the graph

◆ input_vcf

vcflib::VariantCallFile& vg::VCFGenotyper::input_vcf
protected

input VCF to genotype, must have been loaded etc elsewhere

◆ path_to_ploidy

unordered_map<string, int> vg::VCFGenotyper::path_to_ploidy
protected

the ploidies

◆ traversal_finder

VCFTraversalFinder vg::VCFGenotyper::traversal_finder
protected

traversal finder uses alt paths to map VCF alleles from input_vcf back to traversals in the snarl

◆ traversals_only

bool vg::VCFGenotyper::traversals_only
protected

toggle whether to genotype or just output the traversals


The documentation for this class was generated from the following files: