This file contains declarations of common utility functions used in the MSA project.
More...
#include <vector>
#include <string>
Go to the source code of this file.
|
const std::vector< std::string > | VALID_FORMATS = {"fasta", "afa", "fas", "fst", "fsa", "a2m", "a3m", "sto", "clustal", "aln", "pfam"} |
|
const std::vector< std::string > | FASTA_FORMATS = {"fasta", "afa", "fas", "fst", "fsa"} |
|
const std::string | STANDARD_AMINO_ACIDS = "ACDEFGHIKLMNPQRSTVWY" |
|
const std::string | NON_STANDARD_AMINO_ACIDS = "XOUBJZ" |
|
const std::string | STANDARD_RNA_NUCLEOTIDES = "AUCG" |
|
const std::string | STANDARD_DNA_NUCLEOTIDES = "ATCG" |
|
const std::string | NON_STANDARD_NUCLEOTIDES = "N" |
|
const std::string | GAP = "-." |
|
This file contains declarations of common utility functions used in the MSA project.
◆ Alphabet
Enumerator |
---|
protein | |
RNA | |
DNA | |
◆ NonStandardHandler
Enumerator |
---|
AsStandard | |
ConsiderGapInCutoff | |
ConsiderGap | |
◆ Normalization
◆ getAllowedLetters()
std::string getAllowedLetters |
( |
Alphabet | alphabet | ) |
|
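Gets the list of allowed letters for the provided input alphabet.
- Parameters
-
alphabet | the input alphabet (protein, RNA or DNA). |
- Returns
- list of allowed letters
Gets the list of allowed letters for the provided input alphabet.
- Parameters
-
alphabet | the input alphabet (protein, RNA or DNA). |
- Returns
- list of allowed letters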
◆ getFormat()
std::string getFormat |
( |
std::string | file, |
|
|
std::string | name ) |
Get the format from a file path.
- Parameters
-
file | file path. |
name | name of the file (for error messages). |
- Returns
- The format string.
◆ getNonStandardLetters()
std::string getNonStandardLetters |
( |
Alphabet | alphabet | ) |
|
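Gets the list of non-standard letters for the provided input alphabet.
- Parameters
-
alphabet | the input alphabet (protein, RNA or DNA). |
- Returns
- list of non-standard letters
Gets the list of non-standard letters for the provided input alphabet.
- Parameters
-
alphabet | the input alphabet (protein, RNA or DNA). |
- Returns
- list of non-standard letters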
◆ getStandardLetters()
std::string getStandardLetters |
( |
Alphabet | alphabet | ) |
|
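Gets the list of standard letters for the provided input alphabet.
- Parameters
-
alphabet | the input alphabet (protein, RNA or DNA). |
- Returns
- list of standard letters
Gets the list of standard letters for the provided input alphabet.
- Parameters
-
alphabet | the input alphabet (protein, RNA or DNA). |
- Returns
- list of standard letters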
◆ keepNonGapPositionsOfQuerySequence()
void keepNonGapPositionsOfQuerySequence |
( |
std::vector< Sequence > & | sequences | ) |
|
For every sequence, keep only the positions at which the query sequence has a non-gap residue.
- Parameters
-
sequences | The vector of sequences to process. |
◆ FASTA_FORMATS
const std::vector<std::string> FASTA_FORMATS = {"fasta", "afa", "fas", "fst", "fsa"} |
|
inline |
◆ GAP
const std::string GAP = "-." |
◆ NON_STANDARD_AMINO_ACIDS
const std::string NON_STANDARD_AMINO_ACIDS = "XOUBJZ" |
◆ NON_STANDARD_NUCLEOTIDES
const std::string NON_STANDARD_NUCLEOTIDES = "N" |
◆ STANDARD_AMINO_ACIDS
const std::string STANDARD_AMINO_ACIDS = "ACDEFGHIKLMNPQRSTVWY" |
◆ STANDARD_DNA_NUCLEOTIDES
const std::string STANDARD_DNA_NUCLEOTIDES = "ATCG" |
◆ STANDARD_RNA_NUCLEOTIDES
const std::string STANDARD_RNA_NUCLEOTIDES = "AUCG" |
◆ VALID_FORMATS
const std::vector<std::string> VALID_FORMATS = {"fasta", "afa", "fas", "fst", "fsa", "a2m", "a3m", "sto", "clustal", "aln", "pfam"} |