#include <prepro.h>
Public Member Functions | |
PREPRO (string &f1, string &f2) | |
void | getGenome (string &buff, int whichOne) const |
string * | gAlign (vector< KIS< GENOME_TYPE > > &kisses, long &len) |
vector< lightKIS< GENOME_TYPE > > & | lAlign (string &chunks, int whichOne) const |
vector< lightKIS< GENOME_TYPE > > & | extractGaps (string *results, vector< KIS< GENOME_TYPE > > &kisses) const |
vector< vector< lightKIS< GENOME_TYPE > > * > & | extractBPCoords (vector< lightKIS< GENOME_TYPE > > &res) |
string * | extractBP (vector< vector< lightKIS< GENOME_TYPE > > * > &res) |
void | toString (unsigned long num, string &result) const |
vector< lightKIS< GENOME_TYPE > > & | stitchHits (vector< lightKIS< GENOME_TYPE > > &res) const |
string * | GAOnStitchedHits (vector< lightKIS< GENOME_TYPE > > &stitchedHits) const |
vector< lightKIS< GENOME_TYPE > > & | extractGapsFromHits (string *results, vector< lightKIS< GENOME_TYPE > > &hits) const |
void | addToKISTable (vector< lightKIS< GENOME_TYPE > > &add, vector< lightKIS< GENOME_TYPE > > &kisTable) const |
void | print (vector< lightKIS< GENOME_TYPE > > &vec) const |
int | printToFile (vector< lightKIS< GENOME_TYPE > > &vec, string fileName) const |
Private Member Functions | |
void | transformSeq (char *arr) const |
void | getGene (FILE *f, string &buff) |
string | labelIt (GENOME_TYPE i, long count, string name) const |
void | checkStitchedHits (vector< lightKIS< GENOME_TYPE > > &res) const |
void | unionHits (lightKIS< GENOME_TYPE > &elm1, lightKIS< GENOME_TYPE > &elm2) const |
void | stitch (vector< lightKIS< GENOME_TYPE > > &res) const |
void | refineGapTable (long **gaps, long **gaps1, long **gaps2, long &len, string &seq1, string &seq2) const |
void | refineKISTable (vector< KIS< GENOME_TYPE > > &kisses, long **gaps1, long **gaps2, long len, unsigned int i, vector< lightKIS< GENOME_TYPE > > &newkis) const |
void | refineHitTable (vector< lightKIS< GENOME_TYPE > > &hits, long **gaps1, long **gaps2, long len, unsigned int i, vector< lightKIS< GENOME_TYPE > > &newhit) const |
Private Attributes | |
string | fileName1 |
string | fileName2 |
string | genome1 |
string | genome2 |
|
Constructor.
|
|
Simply adds the table "add" to the table "kisTable" ("add" is the table we get from the extractGapsFromHits method).
|
|
Checks the lengths of the stitched hits against a predefined threshold (stitchMinLen). |
|
Extracts the breakpoints out of the genomes and returns an array of two strings where both strings are a multifasta file alike. First string is all breakpoints of the first genome, Second string is all breakpoints of the second genome. Each breakpoint is recognized by its title ( >number of genome (1/2) start of breakpoint end of breakpoint)
|
|
Extracts the breakpoints coordinates out of the KIS table "res" taking into consideration the circularity of both genomes. The method returns a vector of two vector pointers where the first one includes the breakpoint coordinates of the first genome and the second for the second.
|
|
Extracts the gaps out of the global alignment results on the KIS table (uses file umr.h).
|
|
Extracts the gaps out of the global alignment results on the SIS table (uses file umr.h).
|
|
Global alignment method (uses MAFFT) (used also to globally align every table that is structured from a vector of KIS objects).
|
|
The main global alignment method for stitched hits (used also to globally align every table that is structured from a vector of lightKIS objects).. Receives the stitchedHits method's result and performs MAFFT's global alignment procedure on them. The result of the global alignment is returned as an array of strings where string 2*i and 2*i+1 are the results of the global alignment on SIS i.
|
|
Ectracts the genome from file "f" into the string "buff". Note that no title will be saved in buff, just nucleotides.
|
|
Returns one of the genomes in buff (according to whichOne flag, 0 for genome1, 1 for genome2).
|
|
An auxiliary mathod that returns the string name+i+"."+count.
|
|
Local alignment method (includes YASS).
|
|
Prints the table "vec" to the standard output.
|
|
Prints the table "vec" to the path "fileName".
|
|
Refines the gap table by saving the absolute value of the coordinates of "gaps" (gaps holds the extracted unmatched regions. see umr.h) in "gaps1" (coordinates of first genome) and "gaps2" (coordinates of second genome).
|
|
Refines the i'th hit of the hits table according to the given refined gaps for both sequences in the hit.
|
|
Refines the i'th KIS of the KIS table according to the given refined gaps for both sequences in the KIS.
|
|
Performs the action of stitching hits on a given local alignment result (which can also be held in a lightKIS object).
|
|
The main stitching method that receives the result of the local alignment and performs the procedure of stitching hits on it. The stitched hits are returned in a vector of lightKIS objects.
|
|
Converts the positive number num to a string.
|
|
An auxiliary mathod that inverts and transforms a given sequence (A<=>T , G<=>C).
|
|
Unions two stitched hits according to MAGIC's paper.
|
|
The path for the first *.anchor file. |
|
The path for the second *.anchor file. |
|
The first genome (extracted from file *.genome). |
|
The second genome (extracted from file *.genome). |