c++project
HW1_student_code_example/FASTA_readset.cpp
#include "FASTA_readset.h"

#include <cstdlib>
#include <cstring>
#include <ctime>
#include <exception>
#include <fstream>
#include <iostream>
#include <new>
#include <string>

// ******************************************************** Constructors & Destructor Definitions *******************************************************************

// --------------------------------------------------------------------- Ctor
// Builds a read set that holds the default number of sequences (10).
// Delegates to the three-argument constructor so the allocation logic exists
// in exactly one place.
//   path        : characters of the input file path (need not be NUL-terminated)
//   name_length : number of characters to take from `path`
FASTA_readset::FASTA_readset(const char *path,int name_length)
    : FASTA_readset(path,name_length,10)
{
}

// ------------------------------------------------------------------------------------ Overloaded ctor
// Builds a read set that can hold `lines_to_read` sequences.
//   path          : characters of the input file path (need not be NUL-terminated)
//   name_length   : number of characters to take from `path`
//   lines_to_read : number of sequences to allocate room for
// On allocation failure a message is printed and the process exits with
// EXIT_FAILURE. If `path` is NULL or `name_length` is negative, file_path is
// left NULL; Read_Data_From_File() reports that case and exits.
FASTA_readset::FASTA_readset(const char *path,int name_length,int lines_to_read)
{
    total_read_size = lines_to_read;   // Given value
    single_sequence_length = 50;       // each sequence is 50 chars long
    num_of_data_sets = 14;             // 14 data sets available

    // Every owning pointer starts out NULL so the destructor is always safe.
    all_genomic_sequence = NULL;
    data_set_letter_frequency = NULL;
    data_sets_total_reads = NULL;
    data_sets_current_read_count = NULL;
    data_sets_unique_read_counts = NULL;
    file_path = NULL;

    // ---------- Memory Allocation --------------
    try
    {
        // -------- File path: private NUL-terminated copy
        if(path!=NULL && name_length>=0)
        {
            file_path = new char[name_length+1]; // 1 extra space for terminating null character ('\0')
            std::memcpy(file_path,path,static_cast<std::size_t>(name_length));
            file_path[name_length] = '\0';
        }

        // --------- Sequence storage
        // Each row gets one extra byte for the terminating '\0' and is
        // zero-filled, so a row that was never read is an empty C string.
        all_genomic_sequence = new char*[total_read_size]();
        for(int i=0;i<total_read_size;i++)
        {
            all_genomic_sequence[i] = new char[single_sequence_length+1]();
        }

        // ------------ Letter frequency table, zero-initialised
        data_set_letter_frequency = new int*[num_of_data_sets]();
        for(int i=0;i<num_of_data_sets;i++)
        {
            data_set_letter_frequency[i] = new int[4](); // 4 Letters: A, T, G, C
        }

        // ------- Total, current, and unique read counts of all data sets, zero-initialised
        data_sets_total_reads = new int[num_of_data_sets]();
        data_sets_current_read_count = new int[num_of_data_sets]();
        data_sets_unique_read_counts = new int[num_of_data_sets]();
    }
    catch(std::bad_alloc& exception)
    {
        std::cout<<"Dynamic Memory Allocation Failed Inside Overloaded Constructor."<<std::endl;
        std::cout<<"\tDetials: "<<exception.what()<<std::endl;
        exit(EXIT_FAILURE);
    }
}

// ----------------------------------------------------------------------------- Class dtor
// Releases every array owned by the object and prints how long that took.
FASTA_readset::~FASTA_readset()
{
    time_t start = time(nullptr);

    // ------------- Releasing the array holding the read seq data -----------------------------
    if(all_genomic_sequence!=NULL)
    {
        for(int i=0;i<total_read_size;i++)
        {
            delete[] all_genomic_sequence[i]; // De-allocating the sub-arrays
        }
    }
    delete[] all_genomic_sequence;            // Now, de-allocate the main array

    // ------------------------------ Releasing other Memories -----------------------------------------------------
    delete[] data_sets_total_reads;
    delete[] file_path;

    if(data_set_letter_frequency!=NULL)
    {
        for(int i=0;i<num_of_data_sets;i++)
        {
            delete[] data_set_letter_frequency[i];
        }
    }
    delete[] data_set_letter_frequency;

    delete[] data_sets_current_read_count;
    delete[] data_sets_unique_read_counts;

    // Getting ending timestamp
    time_t end = time(nullptr);
    time_t duration = end-start;

    std::cout<<"\n\t\tTime (in seconds) Required to Release All Memory = "<<duration<<std::endl;
    std::cout<<"\n\t\t All Dynamically Allocated Memories Have Been Released. Exiting Program Now."<<std::endl;
}

// ********************************************************** Remaining Member Function Definitions ****************************************************************

// Reads up to total_read_size (header, sequence) pairs from file_path.
//
// A header is split on '_'. Token 0 (the read id) is ignored; tokens
// 1..num_of_data_sets are parsed with atoi() as the read count of this
// sequence in the corresponding data set. For every pair the per-data-set
// totals, unique counts and letter frequencies are updated, and the sequence
// is stored in all_genomic_sequence.
//
// Exits the process with EXIT_FAILURE when file_path is NULL, when the file
// cannot be opened, or when a std::exception escapes the reading code.
void FASTA_readset::Read_Data_From_File()
{
    // If file_path is still NULL, exit the program.
    if(file_path==NULL)
    {
        std::cout<<"NULL File Path Encountered. Exiting Program"<<std::endl;
        exit(EXIT_FAILURE);
    }

    try
    {
        std::ifstream input_file_stream(file_path);
        if(!input_file_stream.is_open())
        {
            std::cout<<"Error Encountered While Trying Open & Read From the Input File. Exiting Program.";
            std::cout<<"\tDetails: "<<"could not open "<<file_path<<std::endl;
            exit(EXIT_FAILURE);
        }

        // std::string grows as needed, so neither the header nor the sequence
        // can overrun a fixed-size buffer.
        std::string header;
        std::string sequence;
        header.reserve(max_read_header_length);

        int seq_index = 0; // Index indicating location to store the current sequence

        // The loop stops at the first failed extraction, so a trailing blank
        // line is never processed as an extra (bogus) record.
        while(seq_index<total_read_size
              && (input_file_stream>>header)
              && (input_file_stream>>sequence))
        {
            // ---- Header line
            // Start from zero so a header with fewer tokens than data sets
            // does not reuse the counts of the previous read.
            for(int i=0;i<num_of_data_sets;i++)
            {
                data_sets_current_read_count[i] = 0;
            }

            int token_number = 0; // Serial number of the token; 0 is the read id
            for(char *token = std::strtok(&header[0],"_");
                token!=NULL;
                token = std::strtok(NULL,"_"))
            {
                // Ignore the read id and any tokens beyond the known data sets.
                if(token_number>=1 && token_number<=num_of_data_sets)
                {
                    const int data_set_read_count = std::atoi(token);
                    data_sets_total_reads[token_number-1] += data_set_read_count;
                    data_sets_current_read_count[token_number-1] = data_set_read_count;
                    if(data_set_read_count>0)
                    {
                        data_sets_unique_read_counts[token_number-1] += 1;
                    }
                }
                token_number++;
            }

            // ---- Sequence line
            // Store at most single_sequence_length characters plus '\0'.
            char *row = all_genomic_sequence[seq_index];
            std::size_t copy_length = sequence.size();
            if(copy_length>static_cast<std::size_t>(single_sequence_length))
            {
                copy_length = static_cast<std::size_t>(single_sequence_length);
            }
            std::memcpy(row,sequence.data(),copy_length);
            row[copy_length] = '\0';

            // Find out the frequency of the letters A,T,G,C in the read sequence:
            int freq_A = 0;
            int freq_T = 0;
            int freq_G = 0;
            int freq_C = 0;
            this->Count_Letter_Frequency(row,freq_A,freq_T,freq_G,freq_C);

            // Weight the letter counts by how often this read occurs in each data set.
            for(int i=0;i<num_of_data_sets;i++)
            {
                const int read_count = data_sets_current_read_count[i];
                data_set_letter_frequency[i][0] += read_count * freq_A;
                data_set_letter_frequency[i][1] += read_count * freq_T;
                data_set_letter_frequency[i][2] += read_count * freq_G;
                data_set_letter_frequency[i][3] += read_count * freq_C;
            }

            seq_index++;
        }
        // The stream is closed by its destructor.
    }
    catch(const std::exception& e)
    {
        std::cout<<"Error Encountered While Trying Open & Read From the Input File. Exiting Program.";
        std::cout<<"\tDetails: "<<e.what()<<std::endl;
        exit(EXIT_FAILURE);
    }
}

// Prints, for every data set: the unique read count, the total read count and
// the accumulated A/T/G/C letter frequencies.
void FASTA_readset::Compute_All_Stats()
{
    std::cout<<"---------------- Total Number of Unique Sequence Fragments in Each Data Set --------------------"<<std::endl;
    for(int i=0;i<num_of_data_sets;i++)
    {
        std::cout<<"Data Set-"<<(i+1)<<" Unique Count = "<<data_sets_unique_read_counts[i]<<std::endl;
    }
    std::cout<<std::endl<<std::endl;

    std::cout<<"--------------- Total Read Counts for Each Data Sets ------------------------------------------------"<<std::endl;
    for(int i=0;i<num_of_data_sets;i++)
    {
        std::cout<<"Data Set-"<<(i+1)<<" Totla Read Count = "<<data_sets_total_reads[i]<<std::endl;
    }
    std::cout<<std::endl<<std::endl;

    std::cout<<"-------------------------- Letter Frequency for Each Data Sets ----------------------------------------------"<<std::endl;
    // Column order of data_set_letter_frequency: A, T, G, C.
    static const char *const letter_labels[4] = {" A = "," T = "," G = "," C = "};
    for(int i=0;i<num_of_data_sets;i++)
    {
        std::cout<<"Data Set-"<<(i+1)<<" : ";
        for(int j=0;j<4;j++)
        {
            std::cout<<letter_labels[j]<<data_set_letter_frequency[i][j];
        }
        std::cout<<std::endl;
    }
}

//******************************************************** Helper Member Functions ****************************************************************

// Adds the number of 'A', 'T', 'G' and 'C' characters in `seq` to a, t, g, c.
// Scans at most single_sequence_length characters and stops early at a '\0',
// so a shorter-than-expected sequence is never read past its terminator.
// Any other character (e.g. 'N') is ignored.
void FASTA_readset::Count_Letter_Frequency(const char* seq,int& a,int& t,int& g,int& c)
{
    for(int i=0;i<single_sequence_length && seq[i]!='\0';i++)
    {
        switch(seq[i])
        {
            case 'A': a++; break;
            case 'T': t++; break;
            case 'G': g++; break;
            case 'C': c++; break;
            default: break;
        }
    }
}

// Returns true when A orders strictly BEFORE B (i.e. A < B byte-wise), false
// otherwise. Despite its name this is a "less than" test; the name is kept
// because it is part of the class interface.
// Both arguments must be NUL-terminated.
bool FASTA_readset::Is_SeqA_Greater_Than_SeqB(const char* A,const char* B)
{
    return std::strcmp(A,B)<0;
}

// Sorts the loaded sequences in ascending order with insertion sort and prints
// the first (up to) 20 of them.
//
// Rows are reordered by moving row pointers rather than copying characters.
// Only the rows that actually hold a sequence are sorted: the constructor
// zero-fills every row and reading fills rows from index 0 upwards, so the
// loaded rows are the leading rows whose first character is not '\0'.
void FASTA_readset::Sort_Seq_Data()
{
    int loaded_count = 0;
    while(loaded_count<total_read_size && all_genomic_sequence[loaded_count][0]!='\0')
    {
        loaded_count++;
    }

    // Performing Insertion Sort on the sequence array
    for(int i=1;i<loaded_count;i++)
    {
        char *key = all_genomic_sequence[i];
        int j = i-1;
        // Shift every row that orders after `key` one slot to the right.
        while(j>=0 && Is_SeqA_Greater_Than_SeqB(key,all_genomic_sequence[j]))
        {
            all_genomic_sequence[j+1] = all_genomic_sequence[j];
            j--;
        }
        all_genomic_sequence[j+1] = key;
    }

    std::cout<<"-------------------- Printing First 20 elements from the Sorted Sequence Array -------------------------------"<<std::endl;
    const int rows_to_print = (loaded_count<20) ? loaded_count : 20;
    for(int i=0;i<rows_to_print;i++)
    {
        std::cout<<"Seq at Index "<<i<<" = "<<all_genomic_sequence[i]<<std::endl;
    }
}
HW1_student_code_example/FASTA_readset.h
#ifndef FASTA_READSET_H_INCLUDED
#define FASTA_READSET_H_INCLUDED

#include <iostream>
#include <string>
#include <string.h>
#include <stdlib.h>
#include <fstream>
#include <ctime>

// NOTE(review): a using-directive in a header leaks into every includer.
// It is kept because the translation units that include this header use
// unqualified names such as cout and string.
using namespace std;

// Holds a set of fixed-length read sequences loaded from a FASTA-style file,
// together with per-data-set statistics (total reads, unique reads, and
// A/T/G/C letter frequencies).
//
// The class owns several raw heap arrays that are released in the destructor,
// so copying is disabled: an implicit member-wise copy would make two objects
// delete the same arrays.
class FASTA_readset
{
    public:
        // Ctor using the default number of sequences set by the implementation.
        FASTA_readset(const char*,int); // pointer to file path name, length of the file path name

        // Overloaded ctor with input filepath to read the specified number of sequences from the file
        FASTA_readset(const char*,int,int); // pointer to file path name, length of the file path name, #of sequences to read

        // Dtor: releases all dynamically allocated arrays
        ~FASTA_readset();

        // Copying would double-free the owned arrays, so it is not allowed.
        FASTA_readset(const FASTA_readset&) = delete;
        FASTA_readset& operator=(const FASTA_readset&) = delete;

        // Function for reading data from input file
        void Read_Data_From_File();

        // Function for computing and printing all stats
        void Compute_All_Stats();

        // Function for solving sub-problem A
        // NOTE(review): declared here; confirm a definition exists before calling.
        void Compute_A();

        // Function for solving sub-problem B
        // NOTE(review): declared here; confirm a definition exists before calling.
        void Compute_B();

        // Function for solving sub-problem C
        // NOTE(review): declared here; confirm a definition exists before calling.
        void Compute_C();

        // Function for sorting the read seq data
        void Sort_Seq_Data();

    private:
        // Total number of sequences to read from the source
        // file into the memory.
        int total_read_size;

        // Length of each sequence
        int single_sequence_length;

        // Number of data sets
        int num_of_data_sets;

        // A 2D char array (one row per sequence) for storing all the sequences read
        char **all_genomic_sequence;

        // An integer array (one entry per data set) for storing the total read counts
        int *data_sets_total_reads;

        // An integer array (one entry per data set) for storing the unique read counts
        int *data_sets_unique_read_counts;

        // An integer array (one entry per data set) for holding the current read-count values only
        int *data_sets_current_read_count;

        // An integer array (one row per data set, 4 columns) for storing letter frequency
        int **data_set_letter_frequency; // Serial: frequency of A,T,G,C

        // Path to the source data file
        char *file_path;

        // Assuming max length of the read header is 1024 Bytes (1KB).
        // A compile-time constant shared by all objects, so it can be used as
        // an array bound.
        static const int max_read_header_length = 1024;

        // -------------------- Helper Member Functions -----------------------------------------------------

        // Will count the frequency of the letters A,T,G,C in the given sequence.
        void Count_Letter_Frequency(const char*,int&,int&,int&,int&);

        // For determining the alphabetical order between two sequences.
        bool Is_SeqA_Greater_Than_SeqB(const char*,const char*);
};

#endif
HW1_student_code_example/INF503_HW1_MdNazmul_Hossain.pdf
INF503 HW-1 (Spring-2021) Md Nazmul Hossain (mh2752@nau.edu)
Problem A:
For initializing the data structure with the first 1 million reads, it took 1 second (measured inside the main.cpp using the <ctime> library) and the CPU time obtained using ‘jobstats -r’ was 3 seconds. The memory requirement for storing 1 million sequence data (each sequence having 50 characters exactly) is 50 Megabytes. From this, we can assume that for doing the same with all 36 million reads, the CPU time would be around 36 to 108 seconds (36 times the time required for 1 million reads) and memory requirement will be around 1800 Megabytes (1.8 Gigabytes). However, memory requirements might slightly vary because of additional memory requirements during the initialization and computation stage.
Problem B:
The CPU time for reading and initializing with all 36 million reads was 53 seconds, and the memory utilised was 2.41 Gigabytes (0.61 Gigabytes more than the predicted 1.8 Gigabytes). I think these discrepancies are acceptable, as the measurements fall close to the predicted values; the prediction counted only the 50 characters of each sequence, whereas the running program also consumes additional memory (for example, one row pointer per sequence and the allocator's per-block bookkeeping). Problem C: The number of unique sequence fragments in each of the 14 data sets:
Total number of read counts for each data sets:
Frequency of A,T,G,C characters in each data sets:
Problem D: For de-allocating all the memories associated with the 36 million reads, it took 1 second (approximate measure) as seen in the following screenshot:
Because de-allocation does not have to clear each memory location (the memory allocator only needs to mark each block as free), it takes much less time than reading and initializing the arrays with the 36 million reads.
Problem-E: Sorting Algorithm used: Insertion sort (Worst Case Complexity: O(n^2)). With 36 million reads, the sequences could not be sorted within a reasonable time. With a reduced size (100000), it took 621 seconds (10 minutes 21 seconds) to alphabetically sort the sequences:
As the time complexity of this approach is quadratic, sorting all 36 million read sequences (360 times as many as the 100,000 sorted above) would take approximately $360^2 \times 621$ seconds (80,481,600 seconds, or approximately 31 months).
HW1_student_code_example/INF503HW1.sh
#!/bin/bash
# Slurm batch script for INF503 HW1.
#SBATCH --job-name=mh2752_INF503_HW1                        # job name
#SBATCH --output=/scratch/mh2752/mh2752_INF503_HW1.output   # stdout and stderr are written here
#SBATCH --chdir=/home/mh2752/INF503/HW1/                    # working directory
#SBATCH --time=6:00:00                                      # wall-clock limit: 6 hours
#SBATCH --mem=4000                                          # total memory: 4 GB
#SBATCH -c1                                                 # one CPU
#SBATCH --mail-type=ALL                                     # e-mail on every job state change; delete this line for no e-mails

# Exactly one of the srun lines below should be active; it selects the sub-problem.

# Sub-problem A
#srun ./output "/common/contrib/classroom/inf503/hw_dataset.fa" A

# Sub-problem B
#srun ./output "/common/contrib/classroom/inf503/hw_dataset.fa" B

# Sub-problem C
#srun ./output "/common/contrib/classroom/inf503/hw_dataset.fa" C

# Sub-problem E (currently selected)
srun ./output "/common/contrib/classroom/inf503/hw_dataset.fa" E
HW1_student_code_example/main.cpp
#include "FASTA_readset.h"

// Entry point.
//
// Usage: output <path_to_input_file> <A|B|C|D|E>
//   A : load the first 1 million reads and report the load time
//   B : load 36 million reads and report the load time
//   C : load 36 million reads, print all statistics, report the total time
//   D : prints a note only (the destructor runs automatically for A, B, C, E)
//   E : load 100000 reads, sort them, report the sort time
//
// Returns 0 on success and EXIT_FAILURE when the arguments are missing or the
// sub-problem letter is not recognised.
int main(int c,char **argv)
{
    if(c!=3)
    {
        cout<<"Required number of Command Line Inputs Not Supplied. Run the Program Again."<<endl;
        return EXIT_FAILURE;
    }

    // The string owns the path; the read set makes its own copy of the
    // characters, so no separate buffer is needed here.
    const string filepath(argv[1]);
    const char *fp = filepath.c_str();
    const int path_length = static_cast<int>(filepath.length());

    const string problem_choice(argv[2]);

    if(problem_choice.compare("A")==0)
    {
        // ------------------------------- Solve Problem A & Show Results ----------------------------------------------------------------------
        // arg1 = file path to data file, arg2 = length of the file path, arg3 = number of sequences to read
        FASTA_readset frst(fp,path_length,1000000);

        // Time only the loading of the first 1 million reads
        time_t start = time(nullptr);
        frst.Read_Data_From_File();
        time_t end = time(nullptr);

        time_t duration = end-start;
        cout<<"\nTime (in seconds) Required to Initialize the Memory with 1 Million reads = "<<duration<<endl;
    }
    else if(problem_choice.compare("B")==0)
    {
        // Solve Problem B (read all 36Mil data) & Show Results
        // arg1 = file path to data file, arg2 = length of the file path, arg3 = number of sequences to read
        FASTA_readset frst(fp,path_length,36000000);

        // Time only the loading of the 36 million reads
        time_t start = time(nullptr);
        frst.Read_Data_From_File();
        time_t end = time(nullptr);

        time_t duration = end-start;
        cout<<"\nTime (in seconds) Required to Initialize the Memory with 36 Million reads = "<<duration<<endl;
    }
    else if(problem_choice.compare("C")==0)
    {
        // Solve Problem C & Show Results (Compute all stats with 36Mil reads)
        // The timer starts before construction, so allocation time is included.
        time_t start = time(nullptr);

        // arg1 = file path to data file, arg2 = length of the file path, arg3 = number of sequences to read
        FASTA_readset frst(fp,path_length,36000000);

        // Load the 36 million reads, then print the statistics
        frst.Read_Data_From_File();
        frst.Compute_All_Stats();

        time_t end = time(nullptr);
        time_t duration = end-start;
        cout<<"Total time to read data and compute all stats with 36Mil reads = "<<duration<<endl;
    }
    else if(problem_choice.compare("E")==0)
    {
        // Solve Problem E & Show Results
        // arg1 = file path to data file, arg2 = length of the file path, arg3 = number of sequences to read
        FASTA_readset frst(fp,path_length,100000);

        // Load the first 100000 reads (not timed)
        frst.Read_Data_From_File();

        // Time only the sort
        time_t start = time(nullptr);
        frst.Sort_Seq_Data();
        time_t end = time(nullptr);

        time_t duration = end-start;
        cout<<"\nTime (in seconds) Required to Sort the Read Sequences Alphabetically = "<<duration<<endl;
    }
    else if(problem_choice.compare("D")==0)
    {
        cout<<" Destructor already implemented. If you choose problem A, B, C, or E - the destructor will execute automatically."<<endl;
    }
    else
    {
        cout<<"Wrong Problem Choice. Try Again."<<endl;
        return EXIT_FAILURE;
    }

    return 0;
}
HW1_student_code_example/makefile
# Builds the `output` executable from main.cpp and FASTA_readset.cpp.

# `clean` is a command name, not a file to be built.
.PHONY: clean

output: main.o FASTA_readset.o
	g++ main.o FASTA_readset.o -o output

# main.cpp includes FASTA_readset.h, so a header change must rebuild main.o too.
main.o: main.cpp FASTA_readset.h
	g++ -c main.cpp

FASTA_readset.o: FASTA_readset.cpp FASTA_readset.h
	g++ -c FASTA_readset.cpp

# -f: do not fail when there is nothing to remove.
clean:
	rm -f *.o output
HW1_student_code_example/readme.txt
Any specialized module requirements: None (you only need make and g++ available on the platform).

Running the program from the command line:

General format: output "path_to_the_input_data_file" subproblem_name

e.g.: To run the program for subproblem B with the input file 'hw_dataset.fa' located in your home folder (assuming a Windows environment), the command is:

output "C:\\Users\\your_user_name\\hw_dataset.fa" B

[Here, output is the executable file created after you have run the makefile (or compiled the .h and .cpp files with g++). Replace B with A, C, or E to run the program for those subproblems.]

*** Subproblem D (destructor) runs automatically after each subproblem is run. There is no need to run it explicitly.
HW1_student_code_example/sample_hw_dataset.fa.txt
>R0_1_0_0_0_0_0_0_0_0_0_0_0_0_0 GTAACTGAACTGTTTGGTCAGCTCAGCGACTACAGACGACTTGTAGTAAT >R1_0_0_0_0_0_0_0_0_0_1_0_0_0_0 AGGGGCAGGCGTACGGCCTTTTCTTCGCGCTCGTCGCGAACGACCGCGCG >R2_0_0_0_1_0_0_0_1_0_0_0_0_0_0 AATGGCTTTTTTTCCAAAGATAAACCGAATTTTTTAATATATTTACTGAC >R3_0_0_0_0_0_0_0_0_0_0_0_0_1_1 GTGACCCAGAAACCCAACCGATCATGATGCGTCTGCAATCGGATCTGGTT >R4_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TTCCGAAAGCTGTACTAAGCCTTTCAGCAGTTGCTTTTGCTTGAGTGGGT >R5_0_0_0_0_0_0_0_0_0_0_1_0_0_0 ACGAGAACTGATAGCCGGCCGTCACCGCGACGCGCTGCTCCGCCTGCGCG >R6_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TGTCGAAGGATGTCGGTAAATCGATATTCTGTGTCGAAACGTCGATATAA >R7_0_4_0_0_0_0_0_0_0_0_0_0_0_0 AAACATGTTGATACAACTGAGTACATTAAACTAGACTATAGCTATTCATA >R8_0_0_0_0_0_0_0_1_0_0_0_0_0_0 ACAAAGAAGGTTGGTTTTTCTGGTTTTGGCCTTCCTGCCTGAATCCAAGT >R9_0_0_0_0_0_0_0_0_0_0_0_0_0_1 ACCATTAATTGATTTTGTTCAGATGCACATCCATTTGTGGGAATGGAATT >R10_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCCGGCGGCTATGCGAAGGACGCGACGACGTTCAGCGAATTCCTGTGGGC >R11_0_0_3_0_0_0_0_0_0_0_0_0_0_0 AACTACTATGATAACCCCATGAATGTTTATGAGCTACATTTAGCCTCATG >R12_3_0_0_0_0_0_0_0_0_0_0_0_1_0 TTATTCCTTCGGTTTAACCTACGGTTATAACCACGGCGAACCGATTGCCA >R13_1_0_0_0_0_0_0_0_0_0_0_0_0_1 GCATTATTGATTGACTCAAAAGACAATTTCACATTTACCGCTAAGGTAAG >R14_0_1_0_0_0_0_0_0_0_0_0_0_0_0 AAATAGCACCAGCAAGTTTTATACAAGAGCATAGTTTTATAATTAAAACA >R15_0_0_2_0_0_0_0_0_0_0_0_0_0_0 GATATTGATAATCCTGATAGTTATATTATCAATATTAAATACTGATAAGG >R16_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ATGTAATGAATGGAGCTTGGGTTGCCCGGGTTTTTTCCATAAATCCATTT >R17_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TATTCAATACAAACCAATGATTAAACAAGGGAACGAATTAGAGAGCAGCG >R18_0_0_0_0_0_2_0_1_0_0_0_0_0_0 AATAAGCGTCGTACCAATAATTCCGGCTGTTAATGCAACAGCTCCTAGAC >R19_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGGCAACGGCTATCTGGAACGCCGCCGCAACATGGTCGGCGGCACGCCGC >R20_0_0_2_0_0_0_0_0_0_0_0_0_0_0 ATAAAATGAACTTATACCTAAATCAGTATATCTTATAGTTTTTATCATAA >R21_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TCAAATGGACGTATCCAATTTGCATTACCGGTATCGTTCTTGGGTTATTC >R22_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TTTTAGCCCCGCGGAGTCTGATCCTGATGGCGGATGAAGCGTGGGGGATC >R23_0_0_0_0_0_0_0_0_0_1_2_0_0_0 
CAGGTTGCCCGACCAGACCGGGCCCGTGCCGTCGACGAACTTCGTGAGCG >R24_0_0_0_0_0_0_0_0_0_1_0_1_0_0 ATTCGATACGCCGAGTTTCCGCGCCGCCCGGCGGAAGCTCTGCAGTTCGG >R25_0_0_0_0_1_0_0_0_0_0_0_0_0_0 ATATTTGCAACCGATCTCGCAACACGTGTGCTAAGAGATGTCGAATAGCT >R26_0_0_0_1_0_0_0_0_1_0_0_0_0_0 AAAGATGTAACAACAGCGATATTTCAATTTATATTCCCGTTTTCATTTAA >R27_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GAGTCGCGGCGCACGCTCGCGACGAAAGCATGAAACAATGATCGGCCGGC >R28_0_0_0_1_0_0_0_0_0_0_0_0_0_0 GTGGTAATTGTTCTTGCANTTCTAATCCACGTCTTGCGATCGTGAATGCG >R29_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GTATCGAGGGGCGCCGCCTGCGTGATCTGGAAGCCGCCGATGAAGGATGC >R30_0_0_0_0_0_0_0_0_0_0_0_0_0_2 TGCGCCATTGTAGACAGAGCGTGCGTAGGGTTCAAGTAGGCCAATATCCC >R31_1_0_0_0_0_0_0_0_0_0_0_0_0_1 CAACTCTTGGTATCGGTTACCGCTTTGCCTTTAAAGCAAGAATCAATGTG >R32_0_0_0_0_0_0_0_0_0_0_0_0_1_1 CTTGTGTTGAGCGCGAAGAGATCGCCCGTGATTTTGTGACCTTCTGGCTA >R33_0_0_0_1_0_0_1_0_0_0_0_0_0_0 CTACAACTATTAATAGGAGGTTTATATTTGAATAACGTTAAACAATATCG >R34_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CCAATTTCATCATTTCGAGTAGTCGTTAATGAAACTGATAAATCTCCTTT >R35_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CTGCCGCCGTACGACGTGCTCGATGCGATCATGCGCCTGTACATGGAGGA >R36_0_0_0_0_1_0_0_0_0_0_0_0_0_0 ATAACTTTGATAATTCATTAATTAAGAGAATCAATAAGATTTTTTCATTA >R37_0_0_0_0_1_0_0_0_0_0_0_0_0_0 AAGACTTACCTATCTCAAACCTGTTAAAAAACAAAAAACTATCGAAAGCA >R38_0_0_0_0_0_0_0_0_0_0_0_2_0_0 GAATACGTCAACGTGAACTCTTCGGACTGCGCATGGTGATAGCCGTACAG >R39_0_0_0_0_0_0_0_0_1_0_0_0_0_0 AAGCAATTTAAAAAAATGATCTGCTGTTTTCGCGATTACAGTTGCATCTT >R40_0_0_0_0_0_0_0_0_0_0_1_1_0_0 CTCCTGGAAGCACGTCAATGTGGGACAAGACATTTTTCATCCGATTGCTC >R41_0_0_0_0_0_0_0_0_0_0_1_0_0_0 TTAACTACAATCCGCCGCAAGGGGTAGCACCTGAACGAAGAAAAGAAGCG >R42_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TTGGTTCAATTTTTGGTTGGTTAGGATTGTTATTTGCGGGCATGCCAGTA >R43_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CATGAAGACGGCGGGCGGCCGCAAGGTCATCAACGCCCGCCGCGCGAAGG >R44_0_0_0_0_0_0_0_0_0_0_0_0_2_1 TTCAATTTATAAACAGTACCTAGTCTCGCTGTTAATGCTGAGTCTGAATA >R45_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CTTTGATTTGCCGCCGCGTTTATAAAGAACCGATGAGTCATGAAGAGGCC >R46_0_0_0_1_0_0_0_1_1_0_0_0_0_0 AGAAGGGATTACCTATGTGGATGAGTTAAAAGTAGGGTATGCATCAGAAG 
>R47_0_2_0_0_0_0_0_0_0_0_0_0_0_0 TGCCTCACAGCCTACTTGCTCTTTAAGTTCAGTTAAAGTTACAGATATCC >R48_1_0_0_0_0_0_0_0_0_0_0_0_0_0 CACGCTGCAAGTGGCTCATGGCGAAGTGGTCGCTGTTGATGGTGAAGCCA >R49_0_0_0_0_0_1_0_0_0_0_0_0_0_0 ACTTAAAGAGCGACCATCCATAACACGGCCTGTGAAAATATCTACAAGTA >R50_0_0_0_0_0_0_1_0_0_0_0_0_0_0 TCTATTTGGGTTATTATATACAGCTAATTTTTCTACGAGTTTCTTACTAG >R51_0_0_0_0_0_0_0_0_0_0_0_0_0_2 CATGATACGCCGAGCAAGCATCTATTTAATAACGCGTCTCGGGCGTTCAG >R52_0_0_0_0_0_0_1_1_0_0_0_0_0_0 ATATGCAATATTTCATATTAGAACTCTACAATACATGAATAAGAAACTTA >R53_1_0_0_0_0_0_0_0_0_0_0_0_0_0 CACATGTACGCTTTCTGCTCAATAGTCTGGTTGCGCCTATTCAGTACGCA >R54_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTCAAATATGTTTAATTGTAGGTGCAGTATTAGCGTTCGTTTCAACTGTA >R55_0_2_2_0_0_0_0_0_0_0_0_0_0_0 TTAAAATCATTAGATCAAATAAAATTTAACTAGCAAAAAGTGATTTAGTA >R56_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTCGGCTGGCGGATCTTCTGAGAATGTTTTAATTGTAAAAGCATTATCTT >R57_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ACCGTCCATCACGCCTGCCTCAACCATTTCTTGTCCTCCGCCAGGATATA >R58_0_0_0_0_0_0_0_0_0_1_0_1_0_0 GAATCAGCCCGGCATTGTTCTGGATCGCACTCCCGCGAACGTCGGCCGTG >R59_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TTCTCAACGCTGATCTTCATCGTGTGGATACGTGGCGCAAATTCAGAGAT >R60_0_0_1_0_0_0_0_0_0_0_0_0_0_0 ATAACAACTACAGAAAAAAATAAAATTAATGAATTTATTGACACAAATAG >R61_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GCAGGCATCGCAATATAACACAAGCATAGTGGAGCGAAGTGTCTCAAACG >R62_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GCCCACCAGTTGCCGGTTAAACGGTATTGATATTCGATTGAGCTGGTGGC >R63_0_0_0_0_1_0_0_0_0_0_0_0_0_0 ATTACGTTTATTTCCTCAGTAGGGATTACAACTGGAAAAGTGATAACTGG >R64_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ACGACCCCCCCAAGCATCTTCATATGGGCATGTCTTTGTGTGTTCGTGTG >R65_0_0_0_0_0_0_0_0_1_0_0_0_0_0 GAGATGTTTTGGATGTTGTTCATTTCGAGCCCAATGAGTGCCCAAGCTCT >R66_0_0_0_0_0_0_0_0_0_1_0_1_0_0 TCTCGGCGCGATAGCGCAGCACGTCGGCGAAATTGGCCGCGGGCGCGAGC >R67_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GTTGGGTTTCACCGCGCTCAAGGAGCAATTCGTTGCTCGAAAGTAGGGTG >R68_1_0_0_0_0_0_0_0_0_0_0_0_0_1 CTGAGCGAGCACTCCGGGATTGCCCGGCGCATTTTGCACCGTGGCGATGA >R69_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TGCAGGCTATAAGATCAATGTGAAAGTGAACCCTGCATTTGTACGCACTA >R70_0_1_2_0_0_0_0_0_0_0_0_0_0_0 
TTCTATTAACAACTTCTACAACACTAGCATTACGCATTTTTCTGAAGTTC >R71_1_0_0_0_0_0_0_0_0_0_0_0_0_0 ACACTGTTAAGTCTCCATCAGCCTTAGTTTTCTGATTTAGCATCGTCACA >R72_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TGCCATTTCGTGTTGATCGCTTAAAAACCGGCACACCACCACGTATCGAT >R73_0_0_0_0_0_1_0_0_0_0_0_0_0_0 ATTCGCTCCGCTTAAAGAATACGAAATCGCTTCCTCCGCACTATATATAC >R74_0_0_0_0_0_0_0_0_0_0_0_0_0_1 AAGCCGCCCCGAAAGGCGGCTGAAAGTGTGCAAGCAAAGGTGTTAAGTTG >R75_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TAATTCAAGGTGAGCGTGAAATGGCTTCTGCAAACAAATCTTTAGGTAGA >R76_0_0_0_0_0_0_0_0_0_2_0_0_0_0 TACCACGTCCGCAACATTGTCAATGTTTGTCATTTCGCTGCCGCAAATTC >R77_0_0_0_0_0_1_0_1_0_0_0_0_0_0 CTTTTTTCCCGTCCTTTTGAAGTAAATTTCGTAATCGTTCCGCTTCTGCT >R78_0_0_0_0_0_0_0_0_0_0_2_0_0_0 GCGATGAGCGTGCGCAGGTCCTCGCGCGGGCTCGTGCCTTTCGAGGCGAC >R79_0_0_0_0_0_1_0_1_0_0_0_0_0_0 GTACCTTCTGTAAGACCGAAATCATCTGCATTTACAATTAATTTAATCAT >R80_0_2_2_0_0_0_0_0_0_0_0_0_0_0 CTGTCACAGTCGGGTTTTAAAACTGCTGTTGTTTCTAAAGTCTTTCCAAC >R81_0_0_0_0_0_0_2_0_0_0_0_0_0_0 CTAGGTACATCCACACACAGCAGCGCATTATGTATTTATTGGATTTATTT >R82_0_0_0_2_0_0_1_0_0_0_0_0_0_0 ATTAACTGGTAAGATACAAATAGGTAGTTTTAGAGGAGGGAAAAGATTGA >R83_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTTGTCATCAAGAAACAGATTTTGTCGCCTTCTCTGTTAGGGAGGGCGGT >R84_0_0_0_0_0_0_0_0_2_0_0_0_0_0 ACTAGGCATAAAGGGATTAGTAATAACTTCGTAACGTGATATAGTGCTCG >R85_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TATTACTTCGTTTAAAACAAAAGTAGTATCCTGTTCCCATTTTTGAACTA >R86_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCGCGCTGCTGAAAGTGCTGTCGAATCCGGATCGATTGCTGATGATGTGC >R87_1_0_0_0_0_0_0_0_0_0_0_0_0_0 AGGTTTTGATGTTTATACCTATGATCACCGTGGTCAAGGACGGTCAGAAC >R88_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GGCGACGGCAACGCCGGCGTGAAGCGGTCGCAAACTGTCTCTTATACACA >R89_0_0_0_1_0_0_0_2_1_0_0_0_0_0 AAAAGCGAAATCCATTCATATCGAAACAGAGGAAGAAAAAGAAGTAGATA >R90_0_0_0_0_1_0_0_0_0_0_0_0_0_0 AATGTAATTGGCGTAATTATGACCGAACAAATGTTGATCGGGGTATTTGC >R91_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GGATCAATATCCGAGGTATCGAAGGAAACCGCATCAAGGTTATCGTTGAC >R92_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TGAAGATGGAAAGATTACGAACATATTACCTGGAATTGTATCAGAGCAAG >R93_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TCGGTTTTATCCAGTGTCAGTGACACGCTGATTTCTGATGTGGTGATGAG 
>R94_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TAACAGTCTTCTACTTTTAGTTCTAGGTTTTCAGCTTTAAACTCTAAGAC >R95_0_1_0_0_0_0_0_0_0_0_0_0_0_0 GATTCTTTATATGAGTCATTCCATTGCAAAGCGAGCTCTACTTGAATATC >R96_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TAAAAAGTCTAATGATAATGTTGTAAATAGCCAAACGCAAGCAATGATAA >R97_0_0_0_0_0_0_0_0_0_0_1_0_0_0 AGCATCGTGTTCGACGTCGACCATTTCAAGTATTCGCGCTTCACGATGCG >R98_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TCTTTTGATTGTGCGGTCATTAAACCCATCACTATATAAAACTGACTCTT >R99_0_0_0_0_0_0_0_1_0_0_0_0_0_0 ATACAAGTAAGTTAAAATTCGGTCACCGTGGTTTAAACCATCCAGTAAAA >R100_0_0_0_0_0_0_1_0_0_0_0_0_0_0 TATCGTAAACGATCTTCAGCGTTTTCATCTTTATTTTGCTGTAATTCCGC >R101_0_0_0_1_0_0_1_0_0_0_0_0_0_0 CGTATGATTTTCCAAGGTTTAGAGTTTACAGGCGAGCGTCCATTTAAAGA >R102_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TTTATCCAAGCCGGTTACGGGATTACCTTATGGGTAGTCATTACACTGAT >R103_0_0_0_0_0_0_0_0_0_0_0_1_0_0 ATAAAAATGTTTCGGCCCGCCGCGATCGAGCCGATTTCCGGCGCGGATCA >R104_1_0_0_0_0_0_0_0_0_0_0_0_1_1 AGTCATTTTTTAAGCATGAAAAATTCATATAAAACGGCTTTGAAAATCCA >R105_0_0_0_0_0_0_0_0_0_0_1_0_0_0 AGGCCGCCCGTCGAGCCGGAGCTGCCGCTGCCGCCCGAACCCGAGCCGCC >R106_0_1_0_0_0_0_0_0_0_0_0_0_0_0 GTATTGCAAACTTAAACCACCATTTCCAACCTTTTAAATGGAATGATTTT >R107_0_0_0_0_0_1_1_0_0_0_0_0_0_0 TAATACACGTCAGTGCAATGTACCAAGCGGTCAGTTATATTGGAACATAG >R108_0_0_0_0_0_0_0_0_0_0_1_1_0_0 CCGCGTAGTGCGCGAACAGATCGGCCACCGTCTCGCCCGTCACGTCCGGC >R109_0_0_0_0_0_0_0_0_0_0_0_2_0_0 ACTGTGTCGTCCGCGGCGCGTCGCGCCGCCCGCCGACTCAACGATTCCCG >R110_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CTTCATGGGCGAGCTGCGCACGATCGGCTGCCGCTTCGCTGTCTCTTATA >R111_0_0_0_0_0_0_0_0_0_0_0_0_0_2 GGGCATTTGTTGGCTAGTCTTATCTGTGAGACAGATTCTAGTGCAAAGTC >R112_0_1_2_0_0_0_0_0_0_0_0_0_0_0 TCCTGTCGTTAGCTCCCTATCTATTTTCTGCTGCACCACAAAATATAAAC >R113_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TACATGTAATCTATAAGGAGTGAGAAATTATGGCAGGGACATTAACGGGT >R114_1_0_0_0_0_0_0_0_0_0_0_0_0_0 AATTCAGGGACAACAGGTAACTGACGCAACGCTTTGGCGAGACCATCAAA >R115_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TAAGGTAGCCAATATTTTTATCTTCAACAAACTCAGCGACTCCGGTAGCA >R116_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CTTCGGCAGTCTGTGCGTGATGGTCGAGGGGCGCTGCGCGCTGTCGTCGT >R117_0_0_0_0_0_0_0_0_1_0_0_0_0_0 
TGTTTAAATATATCTTTTGAAGCTGAAACAGGAACTGCTTTTACCTTTAA >R118_0_0_0_0_0_0_0_0_0_0_2_0_0_0 CGTGCGTGCGCGAGAGCATCGGCTGCTCGGCGTGCGCGTGCGCGAGCGCG >R119_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TTTCTTCTTTATATTCTGTAAAAGGCCATTCTGTATCAGGATAACTTTCT >R120_0_0_0_0_0_0_0_0_0_0_2_0_0_0 GCCGTGCTCGCCCGTGCAGGTGCCGCCCATGCGCAGCGCGCGCTCGACGA >R121_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TTAGCTTTAGTTGCTCTTTAGAATCACTGTGGTTAAATCTCGACTCACAC >R122_0_0_0_0_0_0_1_0_0_0_0_0_0_0 TGCGTAATTGAGAATGATAAAAAGAATTACATAGACCAGGAGCGAAGGGC >R123_0_1_0_0_0_0_0_0_0_0_0_0_0_0 AAAGCCATTATATATTAAGTAATTCATCGCTTTTTGCTTAAACTTGAAAT >R124_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TTTCATTGTATTGCAAGCTGTCGTCCAAAAGAAATTTCGTTATGTTGTAT >R125_0_0_1_0_0_0_0_0_0_0_0_0_0_0 GTCAAAATTGGTAAGCAAATATTAGTAACCAGAGGAGCATTAACAACGTT >R126_1_0_0_0_0_0_0_0_0_0_0_0_0_1 GTGACTCGATCCGTGACAGTATTGATCGTATTGAATTTACCGATTTTCAG >R127_0_0_0_0_0_0_0_0_0_0_1_0_0_0 AGATATGTGCATCCGTCTCTCGCGGAACGCGACGACCTGGTGCTGCCTGC >R128_1_0_0_0_0_0_0_0_0_0_0_0_1_0 GTGCCATTTCTCACCCGATTAATCAACGTAAGTACTATTTAACGCTGTTC >R129_0_0_0_1_0_0_0_0_0_0_0_0_0_0 AACCCTCGATACTAACCAATCTTCAACTTCTTTAATCGTTCCTTCACAAA >R130_0_0_0_0_0_0_0_0_0_0_0_0_1_1 TTCATCATGCAGCTCAAACATCAACTGGTTGAGTTGTTGTAAATCTGCAC >R131_0_0_0_0_0_0_0_0_0_0_0_0_1_1 CGTTTGAATAATGCCGCCAAATTCGCTCGGCACTGTGTAGCCGACCGTAT >R132_0_0_0_0_0_0_0_0_0_0_1_1_0_0 TGCCAGGATTGCCGGAGGCATCGCGCCCGTCGCGATGAATACCCATGGAT >R133_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CGCGCTCGCGTTCCAGCCGCACCGCTTCACGACCGACTTCTGGGGCAACG >R134_2_0_0_0_0_0_0_0_0_0_0_0_0_1 AACCTTTAGTGAAGGTTACACCATTCAATGTCAGCAAATGATGGTTATTT >R135_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CCGCGAGCGTGAGCGCCGTGCCGTCGCGCAACTGCGGCACGACGACATGG >R136_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CTCGACAGCGCCGCGCGGTCCTCGCGCGGCAGATCGTGCTCGACGACGAT >R137_0_0_0_0_1_0_0_0_0_0_0_0_0_0 AATGTACCGGATATGATTTTATATAACGGAAAAATTACTACTCTTGATCC >R138_2_0_0_0_0_0_0_0_0_0_0_0_0_0 AAGACCTTCGTCATCTTCTACGATTAAGACTTTGCTTTGAGCCATCTTCA >R139_1_0_0_0_0_0_0_0_0_0_0_0_0_0 GCTTGACACCTTGTTCAGCATAGAATTTCTCAGTATCTAAATACTCTTGT >R140_0_0_0_0_0_0_1_0_0_0_0_0_0_0 
TATGACAGTTTGGAAGAGTCAATAAAAAAAGAATTTAAAGATAACTATGA >R141_0_0_0_0_0_0_0_0_0_0_0_2_0_0 ATGTCGGAGTCCGAACGCACGCCCGGATAGCGGAACAGGTCCCACGTGCC >R142_0_0_0_0_0_0_0_0_0_0_0_0_0_1 ATTCATGCAGATAGATAGCCGCAATCACGCCTAAAGGCATGACGATGATC >R143_0_0_0_0_0_0_0_0_0_0_1_0_0_0 TGGAGGATGCGCAGCAGCACGAGCAGGACGGGGGCCCAGACGCCGATCGT >R144_0_0_0_0_0_1_0_0_0_0_0_0_0_0 CGCGAAGGGGTGAATATAAATGAGTAAAAAAGTGAAAAAAGATCATTCAN >R145_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TCTCCACTGTTTACGTCTACAAGTGTTACACTTCCTACTTTACCATTTGC >R146_0_0_0_0_0_0_0_0_0_0_0_0_1_0 AAGCACTACGGCAGCATAGCCGTTAACCATGGAACAACTTGGGTTGGCGA >R147_0_0_0_0_0_1_0_0_2_0_0_0_0_0 TAGGCTAACACCTACTGATGTTTTGTTACATAGGGCAAAAGTTTCTGCCT >R148_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGCTTCGCTCATGAACGGCGCATGCGTCGATCGGCACCGGCGCTCGGCGC >R149_0_0_0_0_0_0_0_0_1_0_0_0_0_0 AGGCGTATGATACGCCTACCTTTCAATTATGACACTTCAGTTTTGTTCTT >R150_1_0_0_0_0_0_0_0_0_0_0_0_2_1 ATTGGTCATAAAACGCGTTTCCCAACCTCAATACAATAATGACTGTTTTG >R151_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GGCGCCTCGCCGGCGACGGCCCGCTTCGCCGGCGCGTCGATCCAGCACGA >R152_0_0_3_0_0_0_0_0_0_0_0_0_0_0 ATTCCAAAATCAAAAATTATTCTCGAGAAGAATTCTAAAAACACTTATCA >R153_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TACAGTTGGGTTAAACCACATGGTTCGAAGCGTGACGGGACCATTATCAC >R154_0_1_1_0_0_0_0_0_0_0_0_0_0_0 ATAAGTTTATTGGCTTTCAGCTTAACTCAAGGCAAATGAGCCCAGCGATA >R155_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CTTAAACTGGAAAAGCTTAAAAAACTTCGTGAATTTAAAGATCAGGCAAC >R156_0_0_0_0_0_0_0_0_0_0_0_1_0_0 ACGGCGCGCCGGCCAACACCTGTCTCTTATACACATCTCCGAGCCCACGA >R157_0_0_0_0_0_0_0_1_1_0_0_0_0_0 CCATATTTCATAGAATCAGGATGAACAAATGTCATTGTTCCGATTCCAGC >R158_0_1_1_0_0_0_0_0_0_0_0_0_0_0 AAAGGATCAAGCACTTGTATATATGGAGAGAGCTAATAGATTTAGACAAG >R159_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CATTCTTGATTCTCCACTGGGTTGGCAACCATACGCACTGGAAGCAGCAA >R160_0_0_0_0_0_0_0_0_0_0_0_0_0_1 ATTTACTCAAAACAAACAAGCTCGACGCGATCGAATGTTTGCCGATGCTT >R161_0_0_0_0_0_0_0_0_1_0_0_0_0_0 TAATCCATTCATATGTTCAGCAATGTGACCAATTGTATCAGATCCTAAAT >R162_0_0_0_0_0_0_1_1_1_0_0_0_0_0 ACAAATTGGTAGGTTACTCCAACCTTCGCCTTCATATTGAGCTAATTGCT >R163_0_0_0_2_0_0_0_0_1_0_0_0_0_0 
AGCATCACGAATATGCAGTTCATACAATATAGCATCTGTCATTGCTTGTA >R164_0_0_0_0_0_0_0_0_0_0_1_0_0_0 AATTGATCGCGAACGCCGAGCCCGCGAGCAGCCCGATGCCGATCGTGCCG >R165_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TCGCCGCCGTGCTTGGCGCTAGACTCATGGATATTGCTTGGCCTTGGTTT >R166_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TGCCGCGCCACGGGCTCAACTGCGCGGCGCGCGATCACCGAGCAGATAGT >R167_0_1_0_0_0_0_0_0_0_0_0_0_0_0 AGAGAAGTGTCAAAATTACCGAGGTTTAAAGCATGGTGAGGCTGTTGGTG >R168_0_0_0_1_0_1_0_0_0_0_0_0_0_0 TGTCAAGGAAGTTCATATACACCGATTGCTAAAGATAAAAGTGTTATTAT >R169_1_0_0_0_0_0_0_0_0_0_0_0_0_0 AAGCCGTTTGGCTCGGTATAACGCTTCGTCGGCGCGTGAAACGGTTTCCG >R170_0_0_0_0_0_0_0_0_0_0_1_2_0_0 AGGTCGGCCTGAAGCTGAACGGCAACCGGCTCGACGCGGCCGCGTTCGAG >R171_1_0_0_0_0_0_0_0_0_0_0_0_1_2 AAGATTCGTCCGGTTGATCTTACTAAGCAAGAGCAAGCACAGTATGTGTT >R172_2_0_0_0_0_0_0_0_0_0_0_0_0_0 GAAAAACGTCGCCTTACTTTGGAAAACCGTCAGCTAAAACGCAGTTTAAA >R173_0_0_0_0_0_0_0_0_0_0_1_0_0_0 TCGAACTCGACGTCCGGCCCGAGCAGCGCGTGCACGCGCGGGATCACGCG >R174_0_0_0_1_0_0_0_1_0_0_0_0_0_0 GATATAGCTTCTAGGCTTGGGGATAATACACAAGCTAGTGGTAGAATTAA >R175_1_0_0_0_0_0_0_0_0_0_0_0_0_0 CGTAATCACATCTAATGAATTCCCGCTTAAGCAAAAGAGGAGCTCAGTCG >R176_0_0_0_0_0_0_1_0_0_0_0_0_0_0 AGCCACGAAAAGTGCTTCCGTCACTTCAGCTTATTTAAATCAATATTTTG >R177_0_0_0_0_0_1_0_0_1_0_0_0_0_0 AAAAGTGAAGAAACTAATTGCTATTATACTGGCCGGAGCATTAATTTGGG >R178_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CGTCGGTCTTTTTCCGGTTCGCTATCTCGTCGGCACCGGCTTGCCCCGCG >R179_0_0_0_0_0_0_1_0_0_0_0_0_0_0 ATTTTTCATCATAATTCTCCCTATCCCTCTATTTTTATTAAGCTGATTTT >R180_0_2_0_0_0_0_0_0_0_0_0_0_0_0 TTCCATAACAGCCCTAACCTGTTCAAGGTTATTAACATTAAAAGCTGGTA >R181_0_0_0_0_0_1_0_0_0_0_0_0_0_0 GTAATAACCTCTCGGCAATCTTTTCCTTCTTCCATCATACGAAGCACGCC >R182_0_0_0_0_1_1_1_1_1_0_0_0_0_0 CTATTTCAGCACCAGATAAATCGCATTTACATCACCGTTTACTTGCAATG >R183_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TACTCGATGGGCTCGATGATCCGGTTGTGGTTCGTGTAGATGGACATTAA >R184_0_0_0_1_0_0_0_0_1_0_0_0_0_0 CATTGTAGCAATAGGGAAACAACATAATATAAACAGAAAAAAAGTGTTGC >R185_0_1_0_0_0_0_0_0_0_0_0_0_0_0 AACTAAACGAAAATATTCAATCTTAATAAGTTCTAATAAAATATTTTTCT >R186_1_0_0_0_0_0_0_0_0_0_0_0_0_1 
AAATAATGGCACACTAACCGTATGTGTTTTGATTGCATAAGGTTGAGCTC >R187_1_0_0_0_0_0_0_0_0_0_0_0_1_0 CTGCAACAACTGGCGGTAAGCACAGCCAGTGCGATGCAAAAAAGCCAAGC >R188_0_0_0_0_0_0_0_0_0_1_1_0_0_0 CGCGCGCTCATGGAAAGATGAGCCCCTGCCGCGTCGCCTTCACGGCGGCG >R189_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CCGATGACGCGGATTTTCGATCTGTCGAAACAGTGACGCGCGGCGCCGCC >R190_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CAGCCCCATCATTTGCAGAGAATGCTGGTCCGCGCGCGTGGAATGCTGTC >R191_0_0_0_2_0_0_0_1_1_0_0_0_0_0 AAATGGTTCGAAATATTCGATTGTATATATTGCGAACAATATGTTTAATA >R192_0_0_0_0_1_1_0_0_0_0_0_0_0_0 TAACAGGATTTTTTAATGTTTCATTATATTTATCCTTCATAAAGCTTTCA >R193_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GTTCGTCGAGAAGACGGGCGCGTTGCTGCGCGCGCGGCCGATGAAAGGCA >R194_0_0_0_0_0_0_0_0_0_0_0_0_0_1 AAAGCAGTAGCGTGAATGACTTAAAGTGTGTGATTCATAGACATCCTTTC >R195_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GGACGTGTTCGCGGTCGCGATGAAGAACGTGTCCGCGCGCGCGAGCAGCG >R196_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TGTTTGAACAAGAAGAGATTTCACGGTACGTCTTCTGCGCTGGAACCCAA >R197_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GCCCGAAACCTCGCGCAAAAACAAGGTCTTGCCGAGCTTGCCGTCGATGT >R198_0_0_0_0_1_0_0_0_0_0_0_0_0_0 GATTACTGCGACTATACCATCTGTAATTCTTGCCCGCATTTCACTTTTAT >R199_0_0_0_0_0_0_0_0_0_0_0_0_0_2 TAAGGAACAACCACATTGCCCGGCAAGTTTAAGCTTGCTCCATCGTGCAC >R200_0_0_0_1_0_0_0_0_0_0_0_0_0_0 CATCTTAAACTTTGCTAGAAGCAAGGAAGTAATTTAACAGTCAGTGAAGG >R201_0_0_0_0_0_0_0_0_0_0_0_0_0_2 AGAACATTATTTTGGTGAGCCCCACCACTTTGCTGGTGGCGCTGCGCACC >R202_0_0_0_0_0_0_0_0_0_0_1_1_0_0 GAACCGCCCCAACCGAAGAGCTTCCCGTGAGCACACTCGATCTCGACGCG >R203_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CAACTAAAAACATAATGGCAGCAACTTCTGTTAAAGCGTGTTTGTGTNNN >R204_0_0_0_0_0_0_1_0_0_0_0_0_0_0 AGAGAAAAATGTATTTTAAAAATTCAAACATGAAATATTGTTATTCAAAA >R205_0_0_0_0_0_1_0_0_0_0_0_0_0_0 AGGAAATTTAGATTCTAAGTCGGCAAAATCATTAATGAGCGCGTTGCANN >R206_0_0_0_0_0_0_1_0_0_0_0_0_0_0 CCTATCGTTTTCATTAACTTACACCTACCTTACACTATTTTTTAAAGTTA >R207_0_0_0_0_0_0_0_0_1_0_0_0_0_0 TTAGCTGGCATAATTACTTCATCTCCCGGCTGAATACCAATAGATAACAA >R208_0_0_0_0_0_1_1_0_0_0_0_0_0_0 TACTCCTAGAAGGATCAAGAATAATTCGATTAAAATATTTAGGCTTATTT >R209_0_1_0_0_0_0_0_0_0_0_0_0_0_0 
TATATGACTAAGGCGCCTTAAAGAATATTACGATACCATGATCTATTATT >R210_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ATGAAAAGTTGAAATTATATGGGGTGTTTGCACCAGTAATTCCAGTTTTA >R211_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TGAGCAAATGGTTGCAATTGAGCAATTACGCGTGCAGCCAGAATGGTTAT >R212_0_1_0_0_0_0_0_0_0_0_0_0_0_0 CTGCATAATACTGGTGGTATGCTGCTAACTTCTTGATTGTGAAAACTTGA >R213_1_0_0_0_0_0_0_0_0_0_0_0_1_0 CACTAGGCCCATTGAGCGAGCAGTACCTGCGATAGAACGCTTCATCGCTT >R214_0_0_0_0_0_1_1_0_0_0_0_0_0_0 AACAACAATGAAAGAAATTCGCCTTCAACACGTAAAAGTACAGCAAGAAA >R215_0_0_0_0_0_0_0_0_2_0_0_0_0_0 CTGTGTGAGCATTTAAAAACGCTGCAAAGCCATCAATTTTTCGATATTTA >R216_0_0_0_0_2_0_0_0_0_0_0_0_0_0 GTATGCAACCCATACAAATGAACAAGCTGGACTCGAAATGATTTTACAAG >R217_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CTGACGGGCGACCTCGAGAACGTGCGCTCGTACTACCTGAACCGCGGGTA >R218_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CGTATGATTTTCCAAGGTTTAGAGTTTACAGGCGAGCGTCCATTTAAANN >R219_0_0_0_0_0_1_0_0_0_0_0_0_0_0 ACGAATGGAAAATAAGCAGAAGTCATATGCATCATCAGAAATGTCATCTG >R220_0_1_0_0_0_0_0_0_0_0_0_0_0_0 ATATATCTTATAGATACCAAAAAACACAATCGCTGGAAGCAAATCATTAA >R221_0_0_0_1_0_0_0_0_1_0_0_0_0_0 CATGAAAGAATGGCTGTTTTTATATCTTTAATGAATTTTATAAAAGGTAC >R222_1_0_0_0_0_0_0_0_0_0_0_0_1_0 GGGGTATGCCGTTAGTCCCAGCAATTCTAATAACTTAATCAGGAGCATAA >R223_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGGCTCGCCGATACGCTGCCCGCGCAGTGGGAAGGGCGCGACATCGTCGT >R224_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TAATCATTTCGAACGTTTGGTTTGTAATTGGGTTACTTGGGATATTCCAA >R225_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CGGATTGCTATGGCGATGCCAGAGCGAATTGCCACCAGTTTGGTGGGAGG >R226_0_0_0_0_0_0_0_0_0_0_1_0_0_0 ACGCCGGCGGCGCGTCAGCGCTTCGCCGGCCGCTGGCAGAGCGCGCGACT >R227_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GTTGGCGATCAATGCACCGGCGGCGGCCGCCTGATCGGCCGCGCCCGATC >R228_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TACGTTTCGGATCTTTTACTTCTTCTGCTGAAGTTGCTAATATATCAAAA >R229_0_0_1_0_0_0_0_0_0_0_0_0_0_0 GACACATGCCTTACAGCCAAGACACTTATCTAATGAGTCATAAACTTGGT >R230_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CTTTCTGTACCATGAAGTTTTCGTACCCTAATCCATGGGCAAATTTNNNN >R231_0_0_0_0_0_0_0_0_0_0_0_0_0_1 AATGAATTCGGGGCTGTTTTAATAACGGGATGAATTTCATGCAAGATCCA >R232_0_0_0_0_0_0_0_0_0_0_0_1_0_0 
GCCGGCCGTGGGCGCAGGCCACCACGACTGACATGCCGGCGCAGGAAGGC >R233_0_0_1_0_0_0_0_0_0_0_0_0_0_0 CACCAAGTACATATTGCTTACCAACAATTTTCATTGCTTGTTTCATTGCT >R234_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TCATACTGCATCTCCTGACACGCTTCCCTGCTGAGAGACTTCGGGCTTCT >R235_0_0_0_1_0_0_0_0_0_0_0_0_0_0 AAAACATCTTCTTCATGAACGAAATGTTTTTGAGCAACGTTTAAAGCTTG >R236_0_0_0_0_0_0_1_1_0_0_0_0_0_0 TATATTCCAAAAGAAGTTTTGGAGGGAGAAGATTTCCAAAAAGCTTTGAA >R237_0_0_0_0_0_0_0_0_0_0_1_0_0_0 TAGCCGGTGATCGCGGTGTTGAACACGACTTCGCCGATCGTATGGCCGGC >R238_0_0_0_0_0_0_0_0_1_0_0_0_0_0 AATTGTGTTTACGATAAAAACTTCACAGCCAAATCTTTCTGTAATTAATG >R239_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GGGAACCGACGTAATTCATGCGAATTCATCATCGGACTCCGGATGCAGGA >R240_0_0_0_1_0_0_0_0_0_0_0_0_0_0 AGAAGTAGTGAAAGACGGNTATAGACCGTTATGTCTAAAGAGAGGTGAAA >R241_0_0_0_0_1_0_0_1_0_0_0_0_0_0 TTTACTTCGCCGCAATAAAGAGAGAGCTTTAAATGCGAGCGAAAAACAAA >R242_0_0_0_0_2_1_0_0_1_0_0_0_0_0 TTCTTAAGAATAACTATTAATCGTACTGTTTTGAACGCTTCCTTTTTCTA >R243_3_0_0_0_0_0_0_0_0_0_0_0_1_1 ATTTGTCCCCGCAGGGTTTCCTTGTGGGTTAGTAAAGAGTAAGAAATGGC >R244_0_0_0_1_0_0_0_1_0_0_0_0_0_0 AAATGAGCAGGCCGAGAGTTTGAACATCTTCTAGGACGCTGAAAAACCCT >R245_0_0_0_1_0_3_0_0_0_0_0_0_0_0 TGTACAACGATATGCTGCATCGCTGCACCTAGAGCAATTTCCATTGCAAT >R246_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CACATTTGCCGGTTGAAACTTTCCAGAGGATCGTTCACCTGCGAATGAGG >R247_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TATATCTTTAGCTAGTTTAGTGGCTACTAACTTCCCAGGCTTCTCTTCTC >R248_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CGGCGCACCGTCGTTCGAGCGCCGGAGCCGATCGACCAACGCCTCGCAAT >R249_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TGGTACGCCAGTGCAGGATGATTTTGATGAAACGGACGGCATGCCCCGTG >R250_0_0_0_1_0_0_0_0_0_0_0_0_0_0 CCAATCATACCTATTAAAGGAAACAGCATAATCAAATTCAAGACTGTAAT >R251_0_2_0_0_0_0_0_0_0_0_0_0_0_0 TTGTATACTTGTAGTACTAGAGCATAATTTTGGGAGAGTGCTATGAGTGG >R252_0_0_0_0_0_0_1_0_0_0_0_0_0_0 AAAAAACAACGGCTCAATAAACGACATACATTTCCCGTATGATGACGAGC >R253_0_0_0_0_0_0_1_0_0_0_0_0_0_0 CGTATTCTGCTTGAGAAAGCAAAAGGCTCAAGCTGCACCAGCATGCACAA >R254_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GGATTGCAAAACTTCAGCGCGCATTTGCTCAACCATTGGCGTCAGCGTAT >R255_0_0_0_0_0_0_0_0_0_0_1_0_0_0 
CCGGCGCGCGAAGGCGGCGCGATCCGGCCGCGATTCGCGGAATCACGAGG >R256_0_0_0_0_0_0_1_0_0_0_0_0_0_0 GCAGGAGAGAGTTGGTTAATCCGAACAACTGCAATTAAAGATACATTTTT >R257_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GAACGTCGTCTTCATCATCGTTTCTCCGAAAGCGGATGCGCCGCGCCGGG >R258_0_0_0_1_0_0_0_1_2_0_0_0_0_0 AATTACTTGTAGGGTTGACCAGAGTAGAAACCAAGCTTGATACACTCGGT >R259_0_0_0_0_0_2_0_0_1_0_0_0_0_0 GTAAAGATCCACTTTTTCATTTTATCACTACGTTCTGTAAATCGTAAATA >R260_0_0_0_0_0_0_0_0_0_3_0_0_0_0 ATCAGCGTCGTCATCGACCATAGCGCGAGCGCCATCGGCGCTTTCGCGCG >R261_0_1_1_0_0_0_0_0_0_0_0_0_0_0 TAACGGGCAAAAGATAGTTCTCAATCAACAGCAATTAGAAGCAGTAAATC >R262_0_0_2_0_0_0_0_0_0_0_0_0_0_0 TACAAAAGATGGTTATGAAGTCCTAACACTAAGAGAAGAAGAAAAAAACT >R263_1_0_0_0_0_0_0_0_0_0_0_0_1_0 CTCTAACGCCCATTTTTCTTGCACGTCAAGTAAGCGCTGCGCGACACCAT >R264_0_0_0_0_0_1_1_0_0_0_0_0_0_0 CGTTTCAGGAGAAGGGAATATCCAATGTTTTCTACCGTTCCATTCTACAT >R265_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TACAGAGTTTCTGCGTAAATGGTTTGGGGCAGCTCGACCCAGATAAAATA >R266_0_0_0_0_0_0_1_1_1_0_0_0_0_0 AACAAAGCGTATACGTGAAGCGGATTGGACAATTGCTAAATTGCCAAAAG >R267_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TAATGAAAGATTTCTCCGAACAATCTAAAGAAATAGACGGTATTGTAAAA >R268_0_0_0_1_0_0_0_0_0_0_0_0_0_0 AACATATCAAGCAATTCACTTCGAACAACTGGATCTAATCCTGCTGTTGG >R269_0_0_0_0_0_0_0_0_1_0_0_0_0_0 CGAGTCCTTTCTCCATTCCAAATGAAGAGAAATGGGGGCCTGAATATGTA >R270_0_0_0_0_0_0_0_0_0_0_0_0_0_2 AGCTGTTGATAAATAAAGCCACGATCACGGATTTCGTATGGGTCATCGGG >R271_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TGCACACGAAGGCGCCGCTGCACTTCCTGAACGCGGAAACGAGCCCGGCC >R272_1_0_0_0_0_0_0_0_0_0_0_0_2_0 GTGCATAGCGTTTTTCTATCTTTCAATAGAGGCTAGCGATCTAGTGAGGA >R273_0_0_0_2_0_0_0_1_0_0_0_0_0_0 CAAGGAATTGAGAGTCTAAAAGGTTTAGAGTATATGGAAAATCTAGAAAG >R274_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GGCACGCGGCGACCAAAAATTGGAACCCGGCGGCTAACGCCGGTTCCGTC >R275_0_0_0_1_0_1_1_0_0_0_0_0_0_0 AAGAAGACTATCATATTACCCTTTCATTTTTAGGTAGTGCGACAGAGGAA >R276_0_0_0_0_0_0_1_0_0_0_0_0_0_0 GTGTAATAACAACCTCACTTGTAAATAGAAAAAGGTGTGTATATAAATGG >R277_0_2_0_0_0_0_0_0_0_0_0_0_0_0 GTACCAGTAGTAAGTACATTATTAGGGTTATCAGCATTTCCATACAATCA >R278_0_0_1_0_0_0_0_0_0_0_0_0_0_0 
TTAGGCGTGGTAGGACTAATTGCTGCGATTGGCTGGAAGCTTCTACATAC >R279_0_0_0_0_0_1_0_0_0_0_0_0_0_0 GAATACTTGTCTAATATCTGCAATCCATTCTTCAGCTCCATCTTTATCGT >R280_0_1_1_0_0_0_0_0_0_0_0_0_0_0 TAACTATCCCAATGTACACCATATGTATATCCCTTATGATGTAATTCCTT >R281_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCCGTACAGCCACGGATGGCCGCTCGCCCACAGTGCGCCGAGCAGGATGG >R282_2_0_0_0_0_0_0_0_0_0_0_0_0_0 CTTCAGCTACTTAACCGAAGAGTATGGTGTCGATCGAGAAAGCGCCTTTG >R283_0_0_0_0_0_0_0_1_0_0_0_0_0_0 AGGAACGTTTGCAGAACCTGTTGGTGACTATAAAGAAATTCCGTTTTTCA >R284_0_0_0_0_0_0_0_1_0_0_0_0_0_0 CACAAAAGCAAGATCAAAAAATTGTTGGGTATTTTCCTTCATGGGGCATT >R285_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GAACACGGGCTCCGTCGCGGTCACGGGCACGCCCTTGAAGCGCGCGCGCA >R286_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TCTTTTAAGTCAATATATACTCTAGGATGTAAGTTCCAGTTTTCATGATA >R287_0_0_0_0_0_0_0_0_0_0_0_1_0_0 TATCTGAGCGCATGACGCGCGCTTGTTCGATCGACGAGGTGACGATGAAA >R288_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AAGTGTGTGGGACATTACTAGCTGTTAATGTTGAGGCGTTGACATTATGT >R289_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TAATTAGAAAACCAAATATAGATATTATTAAAGAAGATATTNCCAATTTT >R290_0_1_2_0_0_0_0_0_0_0_0_0_0_0 TTGTATAGTGCCACACTGCCAGCTTCTACCAATTGCATCTTTGAGATGAA >R291_3_0_0_0_0_0_0_0_0_0_0_0_1_0 CCTAAGGGGCTGACAACGCATAACACTAAACTCAAACACAACAACCGAAA >R292_0_0_0_0_0_0_0_1_2_0_0_0_0_0 AGCCTGCGTTGTAAAATGCGTTTGATGACTTTCTCCGATAGCAAATACAT >R293_0_0_0_0_1_0_0_0_0_0_0_0_0_0 GGTGTAGAATACATTGTCATCCCACTAACTGCAAAACCAAATACGTTATA >R294_0_0_0_0_0_0_0_0_0_0_0_0_1_0 ATGCTCGGTTTGGGGGTGCTTTTTAGACGGATTAACCTGATCAATGAGAA >R295_0_0_0_0_0_0_0_0_0_0_0_0_2_0 GCGCATGCTAACAATACCCAAAGGTTTTCCGGTGAATATGGATATTGATT >R296_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TTTTTTCGCTTGGCTCATCAGGATTTTGTGTCGATTCGAAACACCCACAA >R297_0_0_0_0_0_0_0_0_0_0_0_2_0_0 ACGATGATCCGGGCACGCCACCACGCTTGCGGCAACATGCGCCGTATCGA >R298_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GAGGGCCTGCGCGCGCTCGCGCTTGCCGCCACGCTCGTGCTGCTCGCCGC >R299_0_0_1_0_0_0_0_0_0_0_0_0_0_0 ATAATATTATGATATCTAATCAACAACTAGATAGTGCTATACAAGATATT >R300_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GAGCTGATAGACGACGGGCGCGCCCCGCTCGGTGCGCGGCGCGTCGGGCA >R301_0_0_0_0_1_0_0_0_0_0_0_0_0_0 
AGCGAAAACGAGGTCAGCTACTGTATCATCTAGCACGTATGGGGTATTCG >R302_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TCGAAGGCTCATCGTTATGTAGCAGCGGTTCAATGGCATCCAGAAATNNN >R303_0_0_0_0_0_0_0_0_0_0_0_2_0_0 GCTGATACATCACCGGATCGCCGCCGCCCGCCGCGTTGAAGAACGACGTG >R304_0_0_0_0_0_0_0_0_0_0_0_0_1_0 ACGGCATCCAGCGTGACCGCTTCAAGTAGAAAAGGGAAATAAAAACATCA >R305_0_0_0_0_0_0_0_0_0_2_0_0_0_0 GTTGCCGTCCCAGATGTTGTAGTACGAGTTCATGTAATGCGTGCCGTAGC >R306_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TTTTGCAATTTTAAGTGGCTTCTTTGGTGCAGGACTTTTATTCGCTGGCT >R307_0_0_0_0_0_2_0_0_0_0_0_0_0_0 TCGTTGTGAGCATTGTATGGAAATATGTAAAGAAGAAGCACCAAATTTGA >R308_1_0_0_0_0_0_0_0_0_0_0_0_0_0 GGGTCCAAAGTGCTATGGTCGCCAAACAAATTTTGTGATGTCAGCTTTGA >R309_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TGAAGCTGAACTGCATTATCGTAGAAGAATGCGTGAAGAAGCAGCAATTG >R310_0_1_1_0_0_0_0_0_0_0_0_0_0_0 TCTCAAGCTCTGGTAATAAATTAGCTTTCTCAAGGTATTGAGTTACAACT >R311_1_0_0_0_0_0_0_0_0_0_0_0_1_2 ATTGGTTAAGCGTATCGCTCATCATTTGATTGGTCGTCTTCCGCCCAGTG >R312_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TCTTGATCGCCGATGTATTGAGATCTTCAAGCGAGTGCAGAACGATTTCA >R313_0_0_0_1_0_0_0_1_0_0_0_0_0_0 CATTATACATTTCCTTTTTGGGTTTTAATGCTCATATTATAAATAGAACA >R314_0_0_0_0_0_0_0_0_0_0_0_0_1_0 ACTTCAGAATACTAGTGTAGCCGCCTTGACGTGCAGCGAAACGTGGACCT >R315_0_0_0_0_0_0_0_0_0_0_0_1_0_0 ATTCGGTCGGGCAGCCAGGCTTCCGCGTTGTGGCGGCTTGACAGGGCGAG >R316_0_0_0_0_0_0_0_2_1_0_0_0_0_0 AGCAAATACACGAACAATTTTCGGCATCGTTTCGGTAGGTACAAAGGCTG >R317_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTCCATTTTGCGTAGATACCTTTAATTCAGATAATGTAGTAGACCAAATT >R318_0_0_0_0_0_0_0_0_0_1_1_0_0_0 GGGCTTCACGCCGGCCGTGACCGCGCCGTGATAGCCGGTCGGCAGGATGT >R319_0_0_0_0_2_0_0_0_0_0_0_0_0_0 AGTGCAGGAATTGCAGCAAATAAGATAATGAATGTAGCAATTAAACGGTA >R320_0_2_2_0_0_0_0_0_0_0_0_0_0_0 CCTAAAAGTGGTGCTACACCAGCATTGAAACCATTGACTGATTCAGGGAC >R321_0_0_0_0_0_0_0_0_1_0_0_0_0_0 TGCATTTTCAAGCGCTTTCAAATCATAATAATGATACGTTTTTCCATCTA >R322_0_1_0_0_0_0_0_0_0_0_0_0_0_0 AAGAAATAGAGGTTTTCACAACTCGTCCAGATACTCTTATGNGAGCGAAT >R323_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGCTGTAGAGCGCGAAGCCGCGAAAGCGGCCCATCCGCGCGAGCACGAAG >R324_0_1_0_0_0_0_0_0_0_0_0_0_0_0 
GAAAGGTAAAAAATGATTGTGATTTACCAGCTCAAGATTATAAAGATATA >R325_0_0_0_0_0_0_0_0_0_0_0_0_1_1 CAGTGCCGAAACGCCAAAAGAGAGTAAAAGTTCGCGCTGAATGGAGTGAA >R326_0_0_0_0_0_0_1_0_0_0_0_0_0_0 CATGTTCTTCTTTTATGTATAACACCATCATCCGAAACATTTGTAATGTA >R327_0_0_0_1_2_0_0_0_2_0_0_0_0_0 TTTAGATGAAATTTTGACTTTAACAAAAATGGGGATTTTTAGTGGTGATG >R328_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TGTAAACATATAGTCAATAGATAAGTGCTTATGTAAAACCCCTTTTATAC >R329_0_0_0_0_0_0_0_0_0_0_0_0_1_0 CCTGTGTCGCCTGGTGATGAAATCCACATCTATCAAAGCCCTAATGTGCT >R330_0_0_0_0_0_0_0_1_0_0_0_0_0_0 ATCTCTTCGCCAGCTTTAACTTCCTTAATTTCTTTTCCAGCACTATCTAA >R331_0_0_0_0_0_0_1_0_0_0_0_0_0_0 TGAGCCTTTACATCAACCGATGAAAGAACAGGCATTATCTCATTTTGATA >R332_1_0_0_0_0_0_0_0_0_0_0_0_0_0 GTACACCACGCCAATCGATTTGACGTTGGGTAGGATTTCTTTAATCAGTT >R333_0_0_0_0_0_0_0_2_0_0_0_0_0_0 ATTAAGGTTCCATCCAAACTTACTTACAAGGGGCTGATTAAATAAACTCC >R334_0_0_0_0_0_0_1_0_0_0_0_0_0_0 AATTCGTTTTCTTGTTTACTTAATTCTTCTTTAAATCTCGTAAATAATAA >R335_0_0_0_0_0_0_0_1_0_0_0_0_0_0 CCGTCACAATGAGAAGCGACCAACTCTCTATAGAGTATTTCAACGTTATG >R336_0_0_0_0_0_0_0_1_0_0_0_0_0_0 AATAATATTACATATATTACAAAATGACCGCCTGTAATAGGCAGCTTTTT >R337_0_0_0_0_0_1_0_0_0_0_0_0_0_0 AGGTTCGTTAAAGTATCAGCTAAGTAGCCTAAATCAACTGGTAATGTGCG >R338_0_0_0_0_0_1_0_0_0_0_0_0_0_0 ATGTTTTAAACCACTTGTTACAATTTCAATTAACTCTTCTTCGTTATGGC >R339_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AAAAGGATATTTGTCACCATCTACAGAATACATGTTACTATCAAGATAAC >R340_0_0_1_0_0_0_0_0_0_0_0_0_0_0 ATGGACTACCAGATATTAGCTATCTAGTTATCTTCACTATCNGTGTAGTA >R341_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TTATATAGAACAGGGGTACTTTTCGTTTCAATCGGTCTCATATTAGCAAA >R342_0_0_0_0_0_0_0_0_0_1_0_0_0_0 ATGGCGTTCCGGTACTGGTGCCCCGACGGGCAGCCCGCGTGCACGGCCGG >R343_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TCAAACGCATAATCAATATCTACAGAAATTTCTTTGATAGCCAATTTTTT >R344_2_0_0_0_0_0_0_0_0_0_0_0_0_2 GAATCTTAGCCAGCTTGGTAAAAACATGGCGGATTTAAAAAACAAATTGG >R345_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TTTCCCGGGGAAAAAGGTTTAATTAAATTTAATTTTAATAAATTTAAAAA >R346_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ATTTCTTTTTTATGCATAGTTTATTAAAAAATATAATTGTTAATTGTTTC >R347_0_0_0_1_0_0_0_0_0_0_0_0_0_0 
GAGTTTAGAGAAAGCAGTGTTATTTTATGAAAGGAATAATGGGTCATTGC >R348_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GCCAATATAAGGTAGGTGACGATATTTCTGCGCGTAGTCGATACCGACAC >R349_0_0_0_0_0_0_2_0_0_0_0_0_0_0 TACTGCATCTAAAACGACTACAATTGATTTCACTTCTAAGAAAGGTGCTA >R350_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGAAGAACGTGTCGCCGTCGAAGCGGCCGTAATGGCCGTTCTGCGCGCGG >R351_0_0_0_0_1_0_0_1_0_0_0_0_0_0 ATATTCTTTCATTTAAAGAGGTGAAATAGATGCTACCAACAAAATTAAAA >R352_0_0_2_0_0_0_0_0_0_0_0_0_0_0 AAACTATGCGGTCCTTTTAGCTGTTGGAGTTGGCTTATCGGTAATAATTC >R353_0_0_0_0_1_0_0_0_0_0_0_0_0_0 AGGCGTAATTGAACGAACAAAAGAGGGAAGAGAAAACTTATTAGAAGATG >R354_0_0_4_0_0_0_0_0_0_0_0_0_0_0 TCTCAACTTGGTAACGACTGTAGTGTCATAGAATTTGGCGCTGGTAATGG >R355_0_0_0_1_2_1_0_2_9_0_0_0_0_0 CCTCCGTTACACTTTAGGAGGCGACCGCCCCAGTCAAACTGCCCACCTGA >R356_0_0_0_0_0_0_0_0_0_0_1_0_0_0 ATCAAGGACATCATCGATGGCGTGTACAACGCCGACGAGGCGCGCGCCGA >R357_0_0_0_0_0_0_1_0_0_0_0_0_0_0 ATATTACAGATAAAGCAAAAGAGTTTATTGAAACTGCTATGAAAGAAAAT >R358_0_0_0_0_0_0_0_0_0_0_0_0_1_0 CGAGCAAGTCTTTGACATCATCAGGCTTACTCGCAAAAACGGTGATGGGC >R359_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTATGGATGCATCAAGGAATAGTACCGAAACTAGTGTTTTCTCATTCAGA >R360_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TGAATTTGGTTATCAGTTTGAGCGTATGGGCTATTTCTGTGCCGATAACA >R361_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TAAGGAATCGGAATATTTTCCCTTGTTCTATACGAAGGTCACCTGTCATA >R362_0_0_1_0_0_0_0_0_0_0_0_0_0_0 CGTAAAACTAAAACCCCTAGCAGCATTATCTAGTTGCGGTGNAGAAACCC >R363_0_0_0_0_0_1_0_0_0_0_0_0_0_0 CATACCTTTATCTTCTAACATCATTTTCATTTTTTGATTAAATTGTAATC >R364_0_0_0_0_0_1_0_0_0_0_0_0_0_0 ACGTTAAAGCACTCTCAAAGGACGAAGGCATCCACGCCTGGCGCCAGAGC >R365_1_0_0_0_0_0_0_0_0_0_0_0_0_0 CAAATAAAGGTTACTTCTGGTTAGCTGCCAGAGCGGCTTCAATCAGATCA >R366_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CAAATAAAGGTTACTTCTGGTTAGCTGCCAGAGCGGCTTCAATCAGATCG >R367_0_0_0_0_0_0_0_0_0_0_0_1_0_0 TTCGCGGCCGAGGTCCACCACACGTCGTTGCCGAACAGGTCGGAAGAGCT >R368_0_0_0_0_0_0_0_0_0_1_0_0_0_0 ACAGACCTCCTCATGATTCATCTCGTCACGCACAACCGAGAAGAAACACT >R369_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGCCACACGTTCGCGCACGGTCGCGCCGGCGTCCCGCGAGCGCACGTCGA >R370_0_0_0_0_0_0_0_0_0_0_0_0_1_0 
AAATGCAGGTATCTCTAGAAAGAGTGAGAAGAGCATTGCAATAGCGGCAT >R371_0_1_2_0_0_0_0_0_0_0_0_0_0_0 ACCATTTAGCTCACTCATTATAGAATGTATTCTAGAACCTCTCACACCAA >R372_0_0_0_0_0_0_0_0_1_0_0_0_0_0 CCCGTTACGCAAATCATGGGTCCGGTTGTAGACGTTAAGTTTGATGGCGG >R373_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CTAGTAAGTCGGATAGCTCTTCGAGTTTATCGGTTTTTGTGTTCGCTTCN >R374_0_0_0_0_0_0_0_0_0_0_1_0_0_0 ACGTGCTGTGAAAGAGCGAGCGCGAATCGTGCTCGCTCGAGTAGCGCACC >R375_0_0_0_0_3_0_0_0_0_0_0_0_0_0 TTTGCTCTATTGAATTTACTGGAAGTTATCAAAAGTGTAGACCAAAGTTT >R376_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GCCGGGCGGCGGCACATCGATGGATGCGTCGCCGAGGCGCCTGAGGGTTG >R377_0_0_0_0_0_0_0_0_1_0_0_0_0_0 AGCATATTAGAATGCGCATCACTTGTTTCATTATTATCATCGGTTAGAAA >R378_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CGCGCTGAACTTCCTGCAACTGCTGTCGGCGCGCGCCCGCGGGACGCCGC >R379_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GCGCGGGGCTCGACGTGCCGATCTGGCTGCTCGGCTCGAGCCTGTTCAGC >R380_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTACGCAGGGTAGCTGTACGAATGAAAATATCGGGATGAAAAAAGCTCTA >R381_0_0_0_0_0_0_0_0_0_0_1_0_0_0 ATGAAAAGCTTGTCGAGATCGCCGAGCGTCAGTTGATACCAGGTCGGCCG >R382_0_0_0_0_0_0_0_1_0_0_0_0_0_0 AACAGGGAAAGAAATTGATATAAGAAATTTACCACTTCAAGATGCAAAGA >R383_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GAACGCCACCACGCCGCTCGCGGGCGACGTCGGCTCGTCGATGCCGATCG >R384_0_0_0_1_0_0_0_1_0_0_0_0_0_0 ATGCTTGTTCATAATAGTAGTATAATAGTGAATGAGGTGTTAATAGAATG >R385_0_0_0_1_0_1_0_0_1_0_0_0_0_0 CAAACATACACCGAAAGAAGAAGCAACAAAAGAATACAGACAATTACTGC >R386_0_0_0_0_1_0_0_0_0_0_0_0_0_0 GCCATCGCCGCTACAAACGACTCCATTAACATTGCTCCATAACCNNNNNN >R387_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TAATGGCGATTTCAACTGCGATTATCGCCTTTACTCCAAGCNATCAGCAA >R388_0_1_1_0_0_0_0_0_0_0_0_0_0_0 AGTATGATCAAACATTGTCTGATTTCCAAGCTTTTCAGTAACTGTTCCCT >R389_0_0_0_1_0_0_0_0_1_0_0_0_0_0 TACAGCCTGTTCCTTTGTACTTGTAAAACAAAAGCTAGGGCATTAGTATA >R390_0_0_0_0_0_1_1_1_2_0_0_0_0_0 TAGAAGCAATAAATTCATTTTTCATCTGTTCCGCTTTTTCTATTTTATCA >R391_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GGCCGATGCTCGCGAAGCTGTGCATGCGCAGCACGCCCGCCGGGCGTTCG >R392_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TGCGAAATCTAACAACACTTGTCCAACTACACAAATAGCGCCTCCTACAA >R393_0_0_0_0_0_0_0_0_0_0_0_0_1_0 
CATTATTTGGAGCGAAATAGCTCAAAAATCCTAAGTCTGCAGAATCTCGT >R394_0_0_0_0_0_0_2_0_0_0_0_0_0_0 CTAAAAGCATGAGGGACAGCAATTGTGGATCCCATCCCTAAGTCTTTTCG >R395_0_0_0_0_0_0_0_2_0_0_0_0_0_0 TTAATATGAATTTTCGTAATCAAACTCCACCCAATTTTTCCAGTGCGTAT >R396_0_0_0_0_0_1_0_0_0_0_0_0_0_0 AGACGAAGTGGTACTAAATTCATTACCATGCTCGGTGTATATATAGATGC >R397_0_0_0_1_0_0_0_0_1_0_0_0_0_0 CAGCTTCAAAATATAGAGAAACCTATACCTAAAAAGAACGAAGTATTAGT >R398_0_0_2_0_0_0_0_0_0_0_0_0_0_0 TTGACTGCTCAAGCTCTGCTTTTAGCTCTTTTATAGTTGGCTCATCAGCT >R399_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GTCTTTGAAAAGACGCGCTGCAGCACCTGGGTGCTCGTTAGAGAAGCCGA >R400_0_0_1_0_0_0_0_0_0_0_0_0_0_0 GCCTGGATTTCAGAAAGTGTAAATCTAGTTTGTAATTCGCCACTTGAATC >R401_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TCCTTTACTGGAAGTAGCGTAAGACCATTGTTAATAAGGCGTGTTACNNN >R402_0_0_0_0_0_0_0_0_0_0_0_0_1_0 AGCCTGCTCGACTTCGTCTCTAACTCATTGTTCATCTGACTCAAGATCAA >R403_0_0_0_0_0_0_0_0_0_0_0_0_0_2 CCTTATCTATCCGAAAGAAGTCTTCGGTATGCTGTGGTCGGGTTACAAAC >R404_1_0_0_0_0_0_0_0_0_0_0_0_1_0 TTACGAAGCGAGTTTGTGGCATCGGGCCATCTACCGCGTCAACGATCAGC >R405_0_2_0_0_0_0_0_0_0_0_0_0_0_0 TAAATTCTAGTCAGATGGGCTTGTCATTAGAGGGAGTTGCTCTTGATACA >R406_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GAGCGGCCGATGTTCCGCGGCGGGGCGGTGGTCGCGGGCAAGTTGATGAA >R407_0_0_0_1_0_1_0_0_1_0_0_0_0_0 AGAAGATTGCATCGCTTTTTCAATTTCAGTTCCTAAAGTAGAGGCTTCTC >R408_0_0_0_0_0_0_0_0_0_0_0_0_2_0 GGAAAACGCTTTGCCACTGAGCCCTGAGCGGATCCGCGCTATCGCTAAAC >R409_0_0_0_0_0_0_0_0_0_0_0_1_0_0 AGCTATGTGGTTCAATACAAATAAAGTCAGGCCCATTCTTCAGGACGAGG >R410_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GATTTGCTCACTTAGCCCAGCAGGCTCGGCAAACCGATTTACAGCGCTTT >R411_0_0_0_0_0_0_1_0_0_0_0_0_0_0 CTTTAGCATAGTAGGCATAACAAGGTTAGGAACATCCGTTGTTACGACTC >R412_0_0_0_1_0_0_0_0_0_0_0_0_0_0 AGTACAGTAGAATGGATTTGACGGTGTCTTAATTACTGGAAAGTAACACC >R413_0_0_3_0_0_0_0_0_0_0_0_0_0_0 ATATTTTTTAAAATAGTATTTTTTTTAAAAAAATGATCGATGAGCTATGA >R414_1_0_0_0_0_0_0_0_0_0_0_0_1_1 GGGCATTATTATCTTGTACCATGGGATTTAAACCCAGACGGCGACAACGC >R415_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGGCACGATTTCGCTGCACGTCGCACGGCCGTCGCAGGACGAGATCTCGC >R416_0_0_0_0_0_0_0_0_0_0_0_0_1_1 
CTCTGCTTAATGATAAAAACCGCATGCTAGTAGAAATGGTTGAGTTTGGC >R417_0_0_0_0_0_1_0_0_0_0_0_0_0_0 AAAACTTTAATAACGGAATGTAAGAGATATAAGGGGATGGGTTAGTTTGG >R418_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GCATCGCGTGATGGAGATGGGCGCGGCCGCGCTGGTGCGCCTGCTCGAGC >R419_0_0_0_0_0_0_1_0_0_0_0_0_0_0 AATGAGCACCTTTACGAAGGAAAAACTCAATAAATCCGCCTACACCTTTA >R420_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TCTCGTAGGAGAAGTGGCNGAAAAAGAGATTACGATTTTCGTCTCAACTC >R421_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TCGCTTCGCGCGGCGCGTGTGCGTGCGCGGGGACGTGCCCTACGGCGTCG >R422_0_0_0_0_0_0_0_1_1_0_0_0_0_0 TTATGTTTACGAATTTGTCGCTCTAGTTTATCAACTACTAAATCGATAGC >R423_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TGGATCCAAGCTTGTTCGGTTAACTGGGCCAGCTCTCGACTGAGAGTGGT >R424_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ACTATCAAAAAAAGACTCNATTTTTGAAAATCCTCTTTTTATGTACGCTC >R425_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTTCAATATTGGCAGCATAAAGGAAAAGCGAAGAAACAAAGATTTGTTAC >R426_0_0_2_0_0_0_0_0_0_0_0_0_0_0 CTGAATAGAATTCACCAATTGAGTTATCACCACGCAAAACTACAGAAGGA >R427_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CGGCGCGCCGAGTTCCACGCGCGTTTCGATGCGCGTCGAGCACCGTACCC >R428_0_0_1_0_0_0_0_0_0_0_0_0_0_0 CTTAGCTGACTAGAGCCAGGATTAATAGCAACTTTAGTGTTATTATCTGC >R429_0_0_0_0_0_0_0_0_0_1_3_0_0_0 CACGCGGCACGCGGCACGCGGCACGCGGCACGCGGCACGCGGCACGCGGC >R430_0_0_0_1_0_0_2_0_0_0_0_0_0_0 TACGGAGGTACACAATGCAAAAACAGATATGAATGAATTACGCCGAAATA >R431_0_0_0_1_0_0_0_1_0_0_0_0_0_0 TGCTTCAAAGTCTTCTGCACATGCGCAATCTTCCCATTCGCAATCACTTG >R432_0_0_0_0_0_2_0_0_0_0_0_0_0_0 TATAATCCAAAGCTCAAAAAAAAGAGACATTAAAAGTGTCTCCTCCATCA >R433_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TCTCTTCAAAAAAGTTTGATCCACCCTTAGTAAAGAAAACTNTTGGTATA >R434_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TATCTTATCACCACTATGATGGACTAGCTCTAGATAATGAAGGTAAGGCA >R435_1_0_0_0_0_0_0_0_0_0_0_0_0_0 GGCGTTTATCAATTGGTGATTGAAGCGTGTGATGCCACTGGTTGTACTAA >R436_1_0_0_0_0_0_0_0_0_0_0_0_0_0 AGGGACTATCTGGTAGAACAATCTCAACAATGGTGTGGGTCGATTGCCAA >R437_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TGCTGCGCGTGCTGCAGCCGATCGTCGACGTCGGCCTCGAATACGTGAAG >R438_0_0_0_0_0_0_0_1_0_0_0_0_0_0 GTCCGTAATGGACGGATTGAATTACATCAACAGGTACTCCTTTCCCCTTA >R439_1_0_0_0_0_0_0_0_0_0_0_0_0_1 
TGAATAACTTGCCAAATCGGCCCAAAGGCGGATTTAAAAACCGGTTACAA >R440_0_0_0_0_0_1_0_0_0_0_0_0_0_0 CTATTATTAAATAGGAAGAACGTGAGCATCCCCGTCATTAAATTAATTTG >R441_0_0_0_0_0_0_0_1_1_0_0_0_0_0 ACGGTGTACGTAATGATATCGTCTATATCAACGTTGTTTCGATCAGCTGT >R442_1_0_0_0_0_0_0_0_0_0_0_0_0_0 CCGAGTACTTTGTCATCGCGTTTTACCTGAGATAGGCGCACATATTGAAA >R443_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTAAATTAGATCTTTACTGAACATTTTAACTCCTTCTGAACCTAACGTAA >R444_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTCTACTTCGGTGTTCAAGATAATTCTTTACAAAATAGTGAACAAAAGTT >R445_0_0_0_0_0_0_0_0_0_1_0_0_0_0 AGTCGTCGACTTGCCAACGCCGCCCTTCGGGTTTCCCACTGCCAGAATCA >R446_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GAAGTTCGTCGGATCCCCGTGGATCGATACGTACAGCACGTCGCGCCGCG >R447_0_0_0_0_0_0_0_0_0_0_0_0_1_1 TCGTTTCTTGGCGATGCCGCAAAAGCATACCCAGCGAGGGAGAGGGATAT >R448_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TATTACTGAGGTGGAACATGGCACAAGCGCTGCAAGTGAGGACTTCACCT >R449_0_0_0_0_0_1_0_0_2_0_0_0_0_0 GTAATGGCTTTGTCGAAAATGCAATAATGCCGTCAGATGCAAATTTAATC >R450_0_0_0_0_0_0_0_0_0_0_1_1_0_0 GAGCCGTTTCTCGAAGGCGGGCTGCAGCTCGGCAACGTGCGCGGCGAGAT >R451_0_0_0_0_0_0_0_1_0_0_0_0_0_0 CGAGTTAGTTAGCCAAGAAAAAGTAAGGAGTACAAGGGAGACACCTTGTA >R452_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GTATACGAGATCGCGGTGCTGCGCGAGCCGGCGAGCCGCGGCGGCTCCGC >R453_0_0_0_0_0_0_1_0_0_0_0_0_0_0 GATTAAAGGTTCATATGAAGTATTGTCTGGCATTAGTATTGTAACGTTAC >R454_0_0_0_0_0_0_1_1_1_0_0_0_0_0 TCTCCAATTTCATGACAAACTACATTTGCTTTCTTTTCAAAATAACCATG >R455_0_0_0_0_0_0_0_0_0_0_0_1_0_0 TCAGCAGCGCGTCGATGTCGTACACCTTCGGGTTCCTGACTTCTCCCTGT >R456_1_0_0_0_0_0_0_0_0_0_0_0_0_0 ATAGTTCAGGACTTGTTGTGGTGAAATAGCCGGGCTAACTAAATAACCTT >R457_1_0_0_0_0_0_0_0_0_0_0_0_0_1 AATGAGCCGCATCAGTATCTGGGCAGCTTTGATCGCCCGAACATTCGCTA >R458_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCGCAGCGAAGGCGCGATGAAGGCGAAACGTAGCCGACGCACGGGGCGGC >R459_0_0_0_0_0_0_0_0_0_0_0_1_0_0 TTTCAGCGAGATAAGTTTTGTGCAAGCTTCTGGAAAGAAACGAGACCTGT >R460_0_0_0_0_0_1_0_0_0_0_0_0_0_0 ATCAACTGGGCCTAATGCGGATGAAATATACGCATAGACTGAACCACAAA >R461_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TTAGGATTAAACGATTCTGCACTTGAGTTTGAACCAGAAACATATCAAGC >R462_0_0_0_0_0_0_0_0_1_0_0_0_0_0 
CTGATGCTACATTTTCATTACACGCTTCAATATAATGTTAGATTGCTTGT >R463_1_0_0_0_0_0_0_0_0_0_0_0_0_0 AACCCCAAGCGCGATCACCCAGTAACGGATAAAAAACCGAGCGCCTTGAA >R464_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CAGCCTTTACCTGCGCAATCCGCCCCACCAATCAGCCAATCCATTGGGAT >R465_0_0_0_0_0_0_0_0_0_0_1_0_0_0 ACAACCGCAAGCTGCTCGCCGACATCGAGCAGCTCGAGCACAAATCGCGC >R466_3_0_0_0_0_0_0_0_0_0_0_0_0_0 CACATTTACTCTGGCTACACCGTACCCGCGCATTACGACTCGATGATCGG >R467_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GAAATGAACCGATAACAAAGTGAAATACGAAGATAGCTTAAGAGTTTACT >R468_0_0_0_0_0_0_0_0_0_0_0_0_1_2 GAACTCACCTTTGCTGGCGTATTCGAGCAAGAGGGGCAGCGTGAAATCTT >R469_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TGTTACGTTCGATGTCTATATATTTGTCGGAATGTTTTATTTAATATTAA >R470_0_0_0_0_0_0_0_0_0_0_0_1_0_0 TCCACGATCTACGCCGCACCGGCTCGACGCTACTGAACGAAATCGGCTTC >R471_0_0_0_0_0_0_0_0_0_0_0_0_1_0 CTGCTTATCAAACGCCATGGCTTGCTGTTCGGCGGGAACATCATCCACAC >R472_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TTGTTGGAAATATTCTTCGGGATGCACTTCCTGTTATGGGAGTGAAACCG >R473_0_0_0_0_1_0_0_0_0_0_0_0_0_0 GTGTTTCAATCATATGCATTATTTCCGAATTTAACAGCACTTGAAAACAT >R474_0_0_0_0_0_0_0_0_0_1_0_1_0_0 GCCGAATACGGCGCGAAGCTGACGACCACGGTCACGCTGTTCTTCGCGAT >R475_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CAGCGATTTGTGCGGAGCAATCAGTGCAAACTCTTCACCGCCATAACGAT >R476_0_0_0_0_0_0_0_0_1_0_0_0_0_0 TTACGTTGTCTAATACTAGTGATGACCACATTAAGAAATCAAACACATAA >R477_0_0_0_0_0_0_0_0_0_0_0_2_0_0 TCACGCGCCCGAGAAACGCCGCGGGAAACGTCTTGAGCAATTCGGAAGCG >R478_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CAAACCCGCGCCCGCCGCGCCGCGCGCCGGGTCGGTTACTGCGGCGTCCG >R479_0_0_0_0_0_0_0_0_2_0_0_0_0_0 AGTTCTTCAAACACCTCTTCTATTTTTCGATCACCATAAATTTCTTTTAC >R480_0_0_0_0_0_0_0_0_0_1_0_1_0_0 AGCAGCCCGTCGAGGCCGACGTGATCGAATGCGGCGCTCGCCGCGCTGCG >R481_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TTAATGCTTGTTTATAAACATGATCAGCTACATCACCAGCTGCAAATACC >R482_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GAGTCGAACCCCTGTTACCGCCGTGAAAGGGCGGTGTCCTAGGCCTCTAG >R483_0_0_0_0_0_0_0_0_0_0_1_0_0_0 AACACCGCGTCGTTCGGCTCGACGGGCGGCGCGGGGCGCTTTAACAACTG >R484_0_0_0_0_0_0_0_0_0_0_0_1_0_0 AGCTCGCGCTTGCCGCCCGGCCCGTGCCGGAACGTCGGCTNCGCGATGTC >R485_0_0_0_0_0_0_0_0_0_0_0_1_0_0 
GACCGTGATGCCGCACGGGGTGCTGTTTCGCGGTGGCGAGGAGAGAGCCA >R486_0_2_1_0_0_0_0_0_0_0_0_0_0_0 GAAGAAATACCTATAATTGAGCCAGCGATCTTTAGTTTAACTGCATTTGG >R487_0_0_0_1_0_0_0_0_1_0_0_0_0_0 CAGCCAAACGATCTCTCGTTACAAGTAAATCTGATCCACCGCCGATGAAT >R488_0_0_0_0_0_0_0_0_2_0_0_0_0_0 CATACTGTATCCTGTTTTCTTTTATATGGCCTTAACAGATACGGAAAATC >R489_0_0_0_0_0_0_0_0_0_2_0_0_0_0 GATGGTCCGATGCAGGCCGAGGCTCGACGTCGTCGCGCCGACGTCGTACG >R490_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TATTACGAATATTATTGCGTAGACGGTGTGCAAAATGTTTTAACACCTGA >R491_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TTCACTACAATAGCCGCAGATGAGCTAAGCGTTGCGGTAACCATGTCTGA >R492_0_0_0_0_0_0_0_0_0_0_0_1_0_0 TTCATAACAATGCGGCATGCGGATTTTAACAGGCGCCGCGGCGAGGTCCA >R493_0_0_0_1_0_0_0_1_0_0_0_0_0_0 TTGTTACAAGATCCACTTGCAACGACTTACCAGTTAAAAATCCAGGGTCG >R494_0_0_0_0_0_0_0_0_0_0_0_0_2_0 TCGACAAAAAAGCCAACACGCTTGATGAAGCGCTGGCGATGATCGCCGAT >R495_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CAATTGGTTTTGACGCTCCGCATACGGGCCTTCGCCCGCCCATGCCCAAG >R496_0_0_0_1_0_0_0_0_2_0_0_0_0_0 AGAATGTATTAGACGCATACTTTATCATTTCGGCACTTTGGATATCTGTT >R497_0_0_0_1_0_0_0_0_1_0_0_0_0_0 ATCGTGAATACCAAATGTTGCGTAACACTTCATTACGAATTATTCGTGCA >R498_0_0_0_0_0_0_0_0_0_0_1_0_0_0 TGCCGATGCATCAGACTGGATCGCCACTACTGCTCGGAATCGAGCCTTTG >R499_0_0_0_0_0_0_1_0_1_0_0_0_0_0 CCAATTGTTTTAAGTTTATTGGGTCCGCTAAAGCAAGGTATTAGTGTAAA >R500_0_2_2_0_0_0_0_0_0_0_0_0_0_0 TAAATAAATCAGATATCCCTAGTTTCTTAAGAAGAAGATAATAAAAACCA >R501_0_0_0_0_0_0_0_0_0_0_0_4_0_0 AGTTCACCGCGCGGTTTTCGGGCAAGGCGCACAAGCTCGAGGTGCCGGTT >R502_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CGATGGTAATCGCAGAAGAAAAAGAAAAACATACATTGCGTGTGTTAATG >R503_0_0_0_0_0_0_1_0_0_0_0_0_0_0 GGTGGTTTTCTTTTATGTAACGTTTCACTCATATATTTATTTGCCCCTTC >R504_0_0_0_0_0_0_2_0_0_0_0_0_0_0 CCGTTTCAATACGATATCCTCTAATTTTCACCTGATGATCAATTCGACCT >R505_0_0_0_0_0_0_0_0_0_0_0_1_0_0 ATGCGGCTTTCGCTTGCCACTCGCTTGATTTTGTTGTTATAATTCTGTCT >R506_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TACTCGGAGCTGACGTGCAGTTGACCACTGAGCATTTCCACTAAACTGTG >R507_0_0_0_1_0_0_0_0_0_0_0_0_0_0 AACTTATGAAGCGGAAAAAGAGCCATTTAATGGTAATGGCACTTGTTATA >R508_0_0_1_0_0_0_0_0_0_0_0_0_0_0 
TCATCATAGAACTCTAACTTAGCTGCATGCAATAATAATCTATCAACTCC >R509_0_0_0_0_1_0_0_0_0_0_0_0_0_0 AATACCAGAAGCATTTTGACGCATAAAACCTGCACGAAGTAATAACTNNN >R510_0_0_0_0_0_0_0_0_0_0_0_0_1_0 CGTCTTCTGCTTGAAAAACCGAATCACCCGAGTTAACCACTACAGAGTAG >R511_0_0_2_0_0_0_0_0_0_0_0_0_0_0 AAATATGCCTAGTTGAGCTAATATCTTAGATAGCTAAATCAAGCGCTGTT >R512_0_0_0_0_0_0_0_0_0_0_1_0_0_0 TGGCGGGCCGACAGGATGGCTCGTGCATTACGGCTACGACGACGACGGCC >R513_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TAAATAATTTTAATACCAAAACCATAGTAGTGCTGGCAATGATAATCTTG >R514_0_0_0_0_0_0_0_0_0_0_0_0_1_0 CTCATGTCACTCTGCTCACCACCCAACCGGATGTGCCGGTCAGTGAAGTG >R515_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GCGTCGTGCTTGCGCCTCTGTTCTCGATATTCGATACGGTGCTCGCCGCA >R516_0_1_0_0_0_0_0_0_0_0_0_0_0_0 AAAAAGCAGCAACACAGGCTATTCAGGATTTATCAGTTAAANAGGGTGAA >R517_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TATTTGAGATTGTGACCAAAGATCACACAAAATATTTGGCAGAAAGAGTT >R518_0_0_0_0_1_0_0_0_0_0_0_0_0_0 GGAGACGAAGCGGTGTTACAACCAGCTTCTACTGAAATTATCTTAAAACA >R519_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGGCTATTGGGGGTTACCGTCGGCCGACAGAACCGGCCGGCGGTACACGT >R520_0_1_0_0_0_0_0_0_0_0_0_0_0_0 GTCATGATATTTTATTTTAATCTTACTACCCACTTGAATTTTTTTAAAAG >R521_0_1_0_0_0_0_0_0_0_0_0_0_0_0 AGCACCGTTGATGATACCGTTGGTATATCCAGAGGGCACAAAAGCTACTG >R522_0_0_0_0_0_0_0_0_0_0_1_0_0_0 ACCAGTTCCTCGAGCATCGCCTTGCGGTTCTCGATCGTCTCGACCTCGTT >R523_0_0_0_1_0_1_1_0_0_0_0_0_0_0 TGTCGCACCTGATGAAACGTTTAGTTTTAATGGCCGCGTTGGCGTAACGG >R524_0_0_0_0_0_2_0_0_0_0_0_0_0_0 AAAGGAGATGTGCTATCAGGAATTGTTGTTGCTTTAGCGTTAATTCCTGA >R525_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CGACTCGCCGCACGCGCGCTTCGGCATCGTCACGGGCGGCAAGGCGTATC >R526_1_0_0_0_0_0_0_0_0_0_0_0_0_0 ATGAGCGCGCACAACTGCTTGGCGTGAATCTGAAAGGGGTGATGCCGGCG >R527_0_0_0_0_0_0_0_0_0_0_2_0_0_0 CGTCGCCCGGGGCGACCCGCTGCCCCTGCAGCGCGAGCCGCTGACCGATC >R528_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CTGGTGAAGATGGACCTGCGCCTGTTCGAAGCCGCCTACGACCTGGGCGC >R529_1_0_0_0_0_0_0_0_0_0_0_0_1_0 AGAAATCATACTCTCGCTGCTACATTAGGCAATCCACCCCAGATATATAG >R530_0_0_0_0_0_0_0_0_1_0_0_0_0_0 ATGAACTAATGCGCCGCTTCGGTTCTGATAATATGAAAGCAATGATGGAT >R531_0_0_0_0_0_0_1_0_0_0_0_0_0_0 
GAAAGTGCGTGCACAAGAGTTAGTTGATAANNTAAAAGAGCAAATGAAGA >R532_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CCCGCCGCGACTACGACCAGTACTATCGCGGCTTCTCGAATGCCACGCTG >R533_0_0_0_0_0_0_0_0_0_2_0_0_0_0 CGTGTTCGTGTACAAGGGGGCACCCATCGGCCGCATCTACAACCACGCAT >R534_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CCGATGTTTGGACTTATATGTCCAATCGGTAAACCGAATAGAACAGGTAT >R535_0_0_0_0_0_1_0_1_0_0_0_0_0_0 ATCAGCTTCAACTGCTGCATAGTCAATATCAGCGCGAAGTGTATGAAGTG >R536_0_0_0_0_0_0_0_0_0_0_0_3_0_0 CATCATCTACACGTCCGGCACGACGGGCAAACCAAAGGGCGCGCTGCACG >R537_0_0_0_0_0_0_0_0_0_0_0_0_1_0 CTGTTTTTCACCTCAATTTTGATCGGTAAATCGCCAGTGATTCTGCTCAG >R538_0_1_0_0_0_0_0_0_0_0_0_0_0_0 GTAATGTAAAATTTTATAAGTGGTTTGAGTCATGGAAAGACGTGAAAAAA >R539_0_0_0_0_0_0_0_0_0_0_0_1_0_0 AGATTTGTCATTGTGAGCATTTTCATCCCGAAGTTGCGGCGCATTCTGAT >R540_0_0_0_1_0_0_0_0_0_0_0_0_0_0 GCTAGCTATAGTTGAATGGCAAGAACGATTATATCAAGAGCGGAATAAAA >R541_0_0_0_0_0_0_0_0_2_0_0_0_0_0 ATTTTGTACTATAAAAATCAGGATGAAGATCACTTGCAATTACAGAAGGA >R542_0_0_0_0_0_0_1_0_0_0_0_0_0_0 TTTCTTCCGAAAGCTCTCGACCAATACATTCGTGCGAGAGATTCTAAATA >R543_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AAAATATCAAAATATCCAGACAGTAATAACAAAAATATACATAAATACTG >R544_0_0_0_0_0_0_0_2_0_0_0_0_0_0 TTCTCAATTAAGCGATACGTATGGAATATTATATGCAAGATGTAGCAAGG >R545_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TTTTGTATTGCTGGAACCAACCTATCTATAGCATTAGCAAATTTTGCTTC >R546_1_0_0_0_0_0_0_0_0_0_0_0_0_1 AATACGTTTGCAGCTAACTCTTTATCATCCAAGTTTTCTGCGCTCGTTAG >R547_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AATCTTTTAAGATTTCAATTTCTTTTTCTATAAGCTCTTTATTTTCTAAT >R548_0_0_0_0_0_0_0_0_0_0_0_0_2_0 CTGGTGCACTGTCGATCGTCGATCCTGAAGTCAATGTGGACGATCTTTCC >R549_0_1_0_0_0_0_0_0_0_0_0_0_0_0 AGTTATTCTAAATTGTATCGGTGGTATGCCGGCAACAAAAGNTTTAGCAG >R550_0_0_0_0_0_0_0_0_2_0_0_0_0_0 GGTTACAAAGGAAGGAGCATTTTGGGAACGAGATTGTTATCAGTTTTCCA >R551_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TTTTCTTGCTTAGACAATTCTCGTTCTTCCAATAAATCCGGTCTACGTGT >R552_0_3_0_0_0_0_0_0_0_0_0_0_0_0 ATTAGCAATATCTTGTTGTTTAGTCAAATCGGCTTTGATAAATTTTAGGT >R553_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GTCGGATCGAACGCAGTGGGAAGCGACGAAAAGCGTCTGATAACAAAGCA >R554_3_0_0_0_0_0_0_0_0_0_0_0_0_0 
GGTAGCGATCTTCATACTCTTTGTCACGAACTCGGCGCTGGCTACGATCG >R555_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GTCGGTGCTGCCGATCGGCGTCTTCACGTAGGCGATCGTCGCCTGGTGCT >R556_1_0_0_0_0_0_0_0_0_0_0_0_0_0 AACACTCTTTGAGCATTTTCAAGGTCAAGACGTTGAAACCCAACTGGAAG >R557_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GGGCCATTTTACGGTCACTTCATACATTGAACCCATACACGCCGATTTGA >R558_0_0_0_1_0_0_0_0_1_0_0_0_0_0 TATAACCTGATAATGTCGGTCCAATAGCTGGGGCTGTAATCATAACTAGT >R559_0_0_0_0_0_0_0_0_1_0_0_0_0_0 ACTATTAGCTATTATTGTGATGCCAATATTGTTACCTGCTTTAATAGGTT >R560_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CTGGCGCTGACCTACACGAGCCCCGGCCGGTTGCCCGACGGCGTGCGTGA >R561_0_0_0_0_0_2_0_0_0_0_0_0_0_0 AATATAATGATATAGGTTTTAAATTGGGATGAGGATAATAAAATCTATAT >R562_0_0_1_0_0_0_0_0_0_0_0_0_0_0 GCAGGCCTTTTAAGTCCAACTAGTGGTGATGTGCTCTATCGTGGTAAAAA >R563_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AACTATCTTTACAGTTAACTAAATTCGCTCCTTTGAAAGTTAGAGGATAT >R564_0_2_2_0_0_0_0_0_0_0_0_0_0_0 GGTATTATTGCGTTGCAATTATTAGTAGCCTTTGGTAGATTACCTCATAT >R565_0_0_0_0_0_0_0_0_0_0_0_0_1_0 ATTACAGGCCTGCGATCATATGCTCAATCGCAGCAACGATTTCATCGTCA >R566_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TCATCGTAATACTTAAAGTTTTTAAATGCTTTAAATATTATNTCAATATT >R567_0_0_1_0_0_0_0_0_0_0_0_0_0_0 CCCTACAGATTTTATATTGATTCAGCAGGGTTATTAAGTAGATATTATGC >R568_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TCTTCCTTTTTCTTGTATGTATTTGCGCTAATGGTTATAACGAACACCTT >R569_0_0_0_0_1_0_0_0_0_0_0_0_0_0 ATGGTTTAGACGAAAACGACTGGGATGGTCACAAATTATTAACTNNNNNN >R570_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GGCCTCCGTCGCGCCGCCGAGCGCATGGAACGCGCATGCGCCGCCGCAAC >R571_0_0_0_0_2_0_0_0_0_0_0_0_0_0 TATGAAAGAAACCTTCCACAATTGTGGAAGGTTTCTTATTTTTCAATAAC >R572_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TTTTACTCTATCGCACAAAAAAGTTGAAACATTTTTCCAGCGCCAACATA >R573_0_1_0_0_0_0_0_0_0_0_0_0_0_0 ATATTCATAAGCTTCAAATTTTTCAGCTTGTAACACTGGGTTAAAAATTC >R574_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GATGTCATTGAATTAACGTTGTAAATTACTGCTGAAGATGGCTGAGAAAC >R575_0_0_0_0_0_0_1_0_0_0_0_0_0_0 GTAGGAATTTTAGTCGTATTTACAAATGCTAGTTTAGCAATGGCATTATT >R576_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GTCCGGGATCGCGAGCGCGATCCGGCAGTACGTCGCGTTCNATGCCGCGT >R577_0_0_0_0_0_0_0_0_1_0_0_0_0_0 
TAACAAATAGCTCATGGATTACGAAGTTTGAGTTTGAGAAGAATGGTGCG >R578_0_0_0_0_0_1_0_0_0_0_0_0_0_0 CGATGAAAATATTCGAATTACTTGCGATTAAAGTAATCCCAGATNNNNNN >R579_0_0_0_0_0_1_0_1_1_0_0_0_0_0 GTACGGTAAGTCTGATGTTGAATCAACTACTAAATAGTATTCTGGATCAA >R580_0_0_0_0_0_0_0_0_0_2_0_0_0_0 CGGACGCGGCGCGCGAGCTCGGCGTATCGCGGGTCACGCTCTATCGTCTG >R581_0_0_0_0_0_1_0_0_0_0_0_0_0_0 GGAAGCAATATGGAGGAACTACAACAAAATAAATCTGCTTTAGAAGGAAG >R582_0_0_0_0_0_0_0_0_0_0_0_1_0_0 ACTAACGAGAAGCCTATTCCCCCTTGATCTGCTTGAGAAAATCAGGGTCG >R583_0_0_0_0_0_0_0_1_1_0_0_0_0_0 AAGAGGGCGATATATTTGTAGCGATTTCAACATCTGGTCGTACGAAAGAT >R584_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TTCTGCAATTAAATTCGCAATCTCTCCAGATGATTCTCCTGATTGCTCCG >R585_0_0_0_0_0_0_1_0_0_0_0_0_0_0 AAACCAGACACAGAAGCTCCAAGCATTCCAAATAGAATTCAGGCACAAAA >R586_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TTAAAAACTGGTTTTTAGAAGAATATAAAGAGCTATTTGAAGATCCTCAA >R587_0_0_0_0_0_0_0_0_0_0_1_0_0_0 TGCCGCCTCGAAGCCGACGGCGTCCCGCGTGCGCGACGCAACCTGCCTGC >R588_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GTCAATTCCGTGATGGTCGGATTCGCAAGCGCGCTGAACGATCAGGACGC >R589_0_2_0_0_0_0_0_0_0_0_0_0_0_0 AAGCTGTTAAATATGTCAAATCAAATGCAATTGTCTATGCTAGAGATACC >R590_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TATCACTAGTTTTCATTTCTCTTGCATCTTGTTCTCTTTGTCTTAAGGCT >R591_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GTGTCTACTGCACCTTTACATACGGCTTCAGTGATACGTAGACGTGGGCT >R592_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTTTTTATGTATGTGTCTGTACCATCAGTGGAATATTCATTCCACTGATG >R593_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCGACACGCGCCGCGGCACGCTCGAGATGTGCGTCAACGACCTGTTCCCG >R594_0_0_0_0_0_0_0_0_1_0_0_0_0_0 CTAATAAATCGCCTCATACGTGTAGGAAAGCACTCCTTAAATTCAAATTC >R595_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TATATGGATAGCCTTTGCCCGTTTTTACGCTCATTGCTTGATGAGGACTG >R596_0_0_0_0_1_0_0_0_0_0_0_0_0_0 GGTTACTTAGATTTTTTTAATTCCTTGTTTGCTTTATCTATTAACTTAGA >R597_3_0_0_0_0_0_0_0_0_0_0_0_0_0 TGTACGACCTTCAGGAGTTTCTACTTGTGAAATTTCTTGCTTCTGCCCAC >R598_0_0_0_0_0_0_2_0_0_0_0_0_0_0 TTTCATCAATAGTAACCATTTTTTTTAATAGTTCAATTTGATATTTTAAT >R599_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGAGAGCGGCGAGCGCGTCGAGCGTCAGCACGTCCGAGCGCGGTGAGAAT >R600_0_0_0_1_0_0_0_0_0_0_0_0_0_0 
AGGCGAAGTTCTATTTAGAAAAAGTAGGTTTAAAAGAACATATGTATAAA >R601_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CGCCCACTGGTCAAGCGCGCGGCTCGTAAATTCGGGTCCCTGGTCGGTTC >R602_0_0_0_0_0_0_0_1_0_0_0_0_0_0 GCTCAAAAAGAATGGAGTGATGAAGAATTTTGGGAGGCAATCGAGTTACT >R603_0_0_0_2_0_1_1_1_0_0_0_0_0_0 GTAGCTGGTCTGCGATATAACCTTTTACCATTTCAAGTTCTTCTTCAGAC >R604_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CTAGATGTGGTGTTTACGTGGTGTGACGAAGATATAGTAGAGTGAAAAAN >R605_0_0_0_0_0_2_0_0_0_0_0_0_0_0 CAGGGGGATGAGGATTTTATGAAACAAAAATCTATGGATACGCTAGCTGC >R606_0_0_0_0_0_0_0_0_0_0_0_0_1_0 CCCTGTAGGTAGCGTGAAAATTAACGAATCTTAAATCGGCGTAGTGTCTC >R607_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AAAGGTGTAATCTTAATACCTTTTTTCTCAGCAAAGGCTTTATTAGCATT >R608_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CTTCAACGCACATGTGGTCGTGCCACTCAACTATGTACAAATACAACAGA >R609_0_0_0_0_0_0_0_0_1_0_0_0_0_0 TTGCTTCTTGCTGTTTTATTGCGGCTGCATCTTCATCTTTTTCCGTTTTT >R610_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTTCAAACCCTTTTTCTCCTACTAAAGCGACAAAAGCATCCTGTATGAGT >R611_0_0_0_0_0_1_0_0_0_0_0_0_0_0 AGATAGCTAGGCGTGCATTTCTTGCAAAGTCACCAGAACCACCGATACCG >R612_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCCAGATCACCGAATTCGTCGCGCGGACGATCTGGCGCTCCGGATGCTCG >R613_0_0_0_0_0_0_0_0_1_0_0_0_0_0 AAGTCTGTGCAAAGACTAAAAGGTATTTATCAAACTGGCGCAAGTTATTT >R614_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CGGTCGCGGTCGGCGACGCAAATATTGCACGGCGCGGCTGTGGGCACGTA >R615_0_0_0_0_0_0_0_0_0_1_0_0_0_0 ATGCGGCGACGCGAGCCGCGCAAAGCGGCGCTGCGCCGCGTTCGGGCGCG >R616_0_0_0_0_0_0_0_1_1_0_0_0_0_0 TTTGCACTTAAGTGAATATTCTTATCTGCTTTTTGATAATTCTTTTTATC >R617_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TAAGAAAAGCATGCAACAAGCCTTTAAGATCAGCAAAAGAAGCATCCTTA >R618_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TGAAATAACGTAACGGGAAATGATAATTTGACTTAAAATACTTAATAATC >R619_0_0_0_0_0_0_0_0_0_0_0_2_0_0 TATTGGGCGGGCGTGGCGCTCGGCCACACGAATCCCGTCTCGCCCGGGCC >R620_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CTGCGCCCGCGACGCGACAGGTTCCGGATCGTCGTACGGCATGTCGACCA >R621_0_2_0_0_0_0_0_0_0_0_0_0_0_0 ATTTTCAGCAGTAAAATAAGTTTTATCGTATTTTTTTGTAGAGTAAAAAA >R622_0_0_0_0_0_0_1_0_0_0_0_0_0_0 ATATTCTTTTTATAGGGGGCTCGACGCATTATCCAAGCTAAGGTTTTGGA >R623_0_1_2_0_0_0_0_0_0_0_0_0_0_0 
GCAAAATCTAATATAACATTTTCTGGATCATAATTTACATCAAATAAGCT >R624_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TATTACGTTCAAGCTGCAAAATGTCTAATTGGCCGTTTTCCGACCATTTA >R625_0_0_0_0_0_0_0_1_0_0_0_0_0_0 AGCAATTACAGCAAGGTTTAGATATGTTAATCCTTATTTATAAGGATTTA >R626_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GGCGACGGGCTCGAAGCGATAGTTCGAACGGTTGATGTCGGGCGGCAGCA >R627_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GGAGTTTTGCTCTTTCAAGTCGCTTTGAGCAGTTTGGTGCCTTTACTTAT >R628_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GATGCATCAGCACGAAGTTGAGAATGCCGAGCGCCATCCCCGCGCAGCAG >R629_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AACGGTCAAGCTAAATCAGTGACATCGCCATTATCTTTAGTGATCTCAGG >R630_0_0_0_0_2_0_0_0_0_0_0_0_0_0 CTGTTTATTTTTTCTTGCAAAAGAGAGATACTACTTATTATTGCTCTACA >R631_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GCACATCAAGCGCCGACGTCGGCTCATCCAAAATCAACACCGGAGATCGC >R632_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GCGTCGGCGAGAAAGCGCAGATACGGCTCGCTGTGCACGGCCGCGAGCGG >R633_0_0_0_0_1_0_0_0_0_0_0_0_0_0 GCTTGCCCTTTTTTAATGTCCTCGTGGTTAATTAAGCCTACGCACATTGC >R634_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCCTGGCCGATGCGCCGGCGCCCGCGCCCGTGTCCGCGCCGGTCGCCGCG >R635_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TTTGTAGCGTGATCGGCAGAGCAATCGCGATCAAGCGGCGGAAGAAATCC >R636_0_0_0_0_0_0_1_0_0_0_0_0_0_0 GTACTTAGATTTCGATTCAATTCTTTTCGTTACATCTACTTTAGCAAGAT >R637_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TTGGTACACTGAAACTAGTCTCTAGGAAAGGAAGGCTTTACATGATATAT >R638_0_0_0_0_0_0_0_0_0_1_0_0_0_0 AGCTGCGTGCCGAGACGCACGACTTCCGCGATGTCGGCAACCATCCGCTC >R639_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CGACACCTGTGGTTTGGATGCAAGCTTGACCATCGGCGTAATTCCATACT >R640_0_0_1_0_0_0_0_0_0_0_0_0_0_0 CATAGGTTCAAAAGAAGCTTTGAAATATCTATTTAAATATTTCTTTAAAA >R641_4_0_0_0_0_0_0_0_0_0_0_0_2_0 GGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTACGAGTAGGGC >R642_0_0_0_0_0_0_0_0_0_0_1_0_0_0 AGCGAAGCGTTCTATCAGGTGTACGGCATGACCGAGACGGGGCCCGCCGG >R643_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GGAGGAAGGTGGGGACGACGTCAAGTCATCATGGCCCTTACGAGTAGGGG >R644_1_0_0_0_0_0_0_0_0_0_0_0_1_1 ACTGGGCTTGGGTAAACACCCGCCGCAATCAGACCCGCAACGTGCGCCAT >R645_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCGAGCATCAGCGCGAGCGTGATCCAGTTTTCGTTCAACTGCTGCGCGGC >R646_0_0_0_0_0_1_0_0_0_0_0_0_0_0 
AATTGCAATTCCACTTAGTATCTTAATTAACATCATCATCAGTCTTTTAG >R647_0_0_0_0_0_0_1_0_0_0_0_0_0_0 TTCAGGCTCTTTCCAAAAGTATGCGACGAAGTTTATTGGACCAGGAACGG >R648_0_0_0_0_0_1_0_0_0_0_0_0_0_0 GGATGCGGAATTTATGCTGGCTTGTGTAGTTTACTGTTCGATGAATTTAA >R649_0_0_0_0_0_0_1_0_0_0_0_0_0_0 GTAAGTATAAAGAAGTGCAAGAGGGGCTTCATAACCAACAGGAAGTAATT >R650_0_0_0_0_0_0_0_0_1_0_0_0_0_0 GTGTCATTCAAACACCCGAAATTAAATCCATATCACTTATCGTTATATTA >R651_0_0_0_1_0_0_0_0_0_0_0_0_0_0 AAGTTACTTTTCGGTTTANCAGGGAATCCGTCAGCTTGTTATGTAGGATT >R652_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TACGGCAATCATGATGTGGTGGCCGATGCTAAATCCATTACCAGAATATC >R653_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TCCAGCAACTGGGAGAAGAGGCGTTTGATAGCGTGTTGCTGGATAGGTTA >R654_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CCGAACGTCGTCAACGCCGCGGACATCAACGAGCTGCCCGCGAACGGCCT >R655_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GAGCACTCGGAGAAACAATGCCACCTTCACCTTGCAGCGGCTCCATCATC >R656_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CTCGAATGCGTTTCTTCGCATGCGTGCCACGGCGGCGAGCAGCGCTTCTA >R657_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AATTTAGTTTTATCATTTTCTATTTTTTGTTGTGGAATCACCATACTGTA >R658_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GGCGCCTGTCGCCAATCGACTCAGTGTAAGAAAGCTAGCAGGAAATATGC >R659_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GGCTTCCCGAACGGCTTCTCGACGACGATCTGGGTGCGCCCGACGGGCAG >R660_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTATCTCCACAATGGATTTACTTTATATAAGAAAGAACATCTTCAATATG >R661_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TCGTCCGGTAACTGGCGCAGCTTTTCGATAACACCGAGCGTCAAATGGAT >R662_3_0_0_0_0_0_0_0_0_0_0_0_1_0 AATCACAAAACCACTTTATCAACGCAATTCACAGGATTACCCACAGGTGC >R663_0_1_2_0_0_0_0_0_0_0_0_0_0_0 TTTAATCGTTGGGATTCTTTGCAACAAATAGCTACTAACATAATCTTAAA >R664_0_0_1_0_0_0_0_0_0_0_0_0_0_0 GAAAAGATAAACTTGTCACCATTAAAAAAGATGGCGGTATTTCAGGCTTT >R665_0_0_0_0_0_2_0_0_0_0_0_0_0_0 TATCCATCCCACGATCTCTTAGTTTATCTAGACGACCACGGAGTGTTGTG >R666_0_0_0_0_2_0_0_0_0_0_0_0_0_0 TGAAATACATGCTTTACTTTTTCAGCTGGAATATTACTTCCGCCTCTACC >R667_1_0_0_0_0_0_0_0_0_0_0_0_0_0 ATCGATCTGAGTAGGCGTGATAAAGATCATGGCGTCGGATCCCATCTCGA >R668_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TCCATTTCTTGTTTGACTTGATTATAGACTCTTATTTCATCAAATGTTCG >R669_0_0_0_0_0_1_0_0_0_0_0_0_0_0 
AGCTACTTTCATACCCGACTTTGTTTCGTATTTGATGCCAAAACTACCTT >R670_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CAGGTCCAACTGGTATAACAGGCCCAACAGGGATAACTGGACCATCAGGA >R671_0_0_0_0_0_0_0_1_1_0_0_0_0_0 GTGATTCCAGCGTACTCTTGCTTCTTTCGCCCACGTATGGTCATCTTCTG >R672_0_0_0_0_0_1_0_0_0_0_0_0_0_0 AGACATCGGAGTAATTCGTTCAAGTAACTGCCCATTCTTCCTTGTAGAGG >R673_2_0_0_0_0_0_0_0_0_0_0_0_0_0 ATAACGCCCCATTATTGGGGCGTTATTGCCTTCCTACTTGAAGCTGCAGC >R674_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TGTGATATATCGGATGAAGAAATTGAACAAAAAGCACAAAGTTATATAAA >R675_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TTGGGTCATGAAGAATCGAGTGAGCTCTTGCTACACCGAGTGAAAATGTT >R676_0_0_0_0_0_0_0_0_1_0_0_0_0_0 GACAGTTAACTACCTTTTCTATTTATAAATTTGGAATTTCCCAATCAATT >R677_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TGTGCTTCAATTCTACACAAAACAGCTGAGAAAGCATCTGAAGTTACACA >R678_0_0_0_1_0_0_0_1_0_0_0_0_0_0 TTGGTTTTGAAGTTTACTCGTAAAGTAAATTAAAACGTTACGGCAAAGTA >R679_0_0_0_0_3_1_1_1_1_0_0_0_0_0 TAACAAGCAAGTTCATGAAGAATAGGAGCAATTTTGTCATAGTGCTTCGT >R680_0_0_0_0_0_0_0_0_0_0_0_2_0_0 ACGGTGCTGCGCGTCGTCAGCAGCGAGGCGAGCGGGCGCGGGCCGGGGCC >R681_0_0_0_0_0_1_0_0_0_0_0_0_0_0 AATTAATGTCGTATCAAGCGAAAGCTCTCGGTAAAAAAAACGTGTCAGTT >R682_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TTAAAGAGTACCGTAGAAGTATAAAAAGACTCCTATGAAAATAGGAGTCT >R683_1_0_0_0_0_0_0_0_0_0_0_0_1_1 AACGCTTACTGTCAAGACAACGACATCAGCTGGTTAAACTGGGAAAACAA >R684_0_0_0_0_0_0_0_2_2_0_0_0_0_0 AATCAAACGATATTTTACGTGATTATATGAAAACAATTGGTTACTAACTT >R685_0_0_0_0_0_0_0_0_0_0_0_0_1_0 ATCGCACTCTGCCGCTTATGCGCTGGTTTCCTACCAAACCTTATGGTTGA >R686_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ATACTTCGTAGTAGAAGAAAATTTCGTTACAAATTTATCACCGTTAACGT >R687_0_0_0_0_1_0_0_0_0_0_0_0_0_0 ATATGGCCAATCGAGATAAGGGGAGAGCAATAAAAGTAAATGGTGTACTT >R688_0_0_0_0_0_1_0_1_0_0_0_0_0_0 TGGCCGACACTTGAGAAGCTTAAAAAGAGTAAATTTTTGAGTTGGGTATA >R689_0_0_0_1_0_0_0_0_1_0_0_0_0_0 CAATGTATAAGCTCGCTGCCATTCTAGCGACTTTTGCAGAGCCTATATTC >R690_0_0_0_0_0_0_0_0_0_0_0_3_0_0 CCGCCAAGAGCCATCGACGCGCCTAACAACATCATTTGTCCGGCGAAGGG >R691_0_0_0_0_1_0_0_0_0_0_0_0_0_0 GGGAGAGAGAGCAGAAGCGAAACAACGGTTACGGTTAAAGATGGAAGTTT >R692_0_0_0_0_0_0_1_0_0_0_0_0_0_0 
CGCCGCGAGAGGTTAAGTAGAGTGCAAGAGCACGTGAACACGCAAGAACG >R693_0_0_0_0_0_0_0_3_1_0_0_0_0_0 ACCGAGAGATATAGTAAGCCTCTTTATCATGAATGGTTTGTAAATCTCCT >R694_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TGCTACTGCCTTCATATAGATGGAAAGACGGTCAATGACAACCAAGTAGT >R695_0_0_0_1_0_0_0_0_0_0_0_0_0_0 AATATGATTGTATATACAAATAGCACTAGGCTGCTAGAACGGATTGTTTC >R696_0_0_0_0_0_0_0_1_0_0_0_0_0_0 AAACGGAATCAAATGTCCGATATGCATACTATCACCAGTCGGATCAACTC >R697_0_0_0_0_2_0_0_0_0_0_0_0_0_0 TCTATCTATCCCTTTCCTTATTTTATTGTATACGAAATCCCTATAATTCC >R698_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TTGGGTCTCTCGGCATCGGCCAAATACAAAAAATCAGCACGTACCGTGGG >R699_1_0_0_0_0_0_0_0_0_0_0_0_1_0 CAACTGCGAGAGCAGTTAAATTTAAGGCGGGTATCTATAGCAAAAAGAAG >R700_0_0_0_0_0_0_0_2_1_0_0_0_0_0 AATACGTGACAAATCTTTACGATATAAATTAATTATATCTTTTAAAGCTG >R701_0_0_0_0_0_0_0_0_1_0_0_0_0_0 TCTCATGAATTGCTTCATCAATTACACCTGCTGTACGATAAGCTGCACTT >R702_0_1_0_0_0_0_0_0_0_0_0_0_0_0 GCAAGTTGGAATTAATAGCGCCTCCCAGAAAACATAATAAAGTATCGAAT >R703_1_0_0_0_0_0_0_0_0_0_0_0_1_1 TATCGTGTGTTACAAGAACCCGGAAGAATGTGGAAGCGTTATTTAATTAC >R704_0_0_0_2_0_0_0_1_1_0_0_0_0_0 ACATTGTGTTTGTTCCATTATTTCCGCTATTAAACTAGCATTTTCTAAAA >R705_0_0_0_0_3_0_0_0_0_0_0_0_0_0 TTCGGCTAATCTCTTACCTTCACCATAATTGAAGTCATTCCTATCTCCAT >R706_0_0_1_0_0_0_0_0_0_0_0_0_0_0 CCAGTTTTTCAGAGAATATTTGTTGATGGTATTGCTAAGTTTATTGCGCC >R707_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGAGCACGCCGCGATAGCGCGCCGCCTGCACGTTCTTCACGAACTGGTCG >R708_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CTGGCATGTTGGTGCACCGTTCATGGCTCGACAAGCATGAAACCGAGTTT >R709_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GGCCCGCGTGCCCGGTTCGCATCCCTGGTTCGCATCCCTGGTTCGCATGC >R710_0_0_0_0_0_0_0_0_0_0_0_0_1_0 AATTTTGGTGAAAGCTTATTTCGTGGCGGCGATGTGGTTTACTTGATTGT >R711_0_0_0_0_0_0_1_0_0_0_0_0_0_0 CATGTTCCCCGCGGTGCACCCTTTTTAACTTTTCTAGCTCATCGATGTCA >R712_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TTGGTACGCTATTGTGCTGTTGGCACGATGAGAAAGTCTTCACGCGCGTG >R713_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCGTGTCGTGCGTGAACGCGCTCTCGAGCTGGCTGCGCCTCATCGTGCGC >R714_0_1_0_0_0_0_0_0_0_0_0_0_0_0 AACGCGCTGGCAATGCTACTCCAGTAATCCCCTTTACATCGTCATACGCT >R715_0_0_0_0_0_0_2_1_1_0_0_0_0_0 
CATCAGTTGTAAAGCTAGATAAAACAGCTAGTTCAAGTGCATTATAAGCG >R716_1_0_0_0_0_0_0_0_0_0_0_0_0_1 ACCCCGCGTCCGTGTGTTATCGTTAAGCACGATAAGGGCTATGAAACTGG >R717_0_0_0_0_0_0_0_0_2_0_0_0_0_0 TTCATTCTCTAATCGATAGATTGATTCTACAATCGCTTTAAAAATAGGTG >R718_0_0_0_0_0_0_0_0_0_1_0_2_0_0 GGGACGGCGCGGCCGCGCGAGAGGCTCGGGCCGGCTTATTTCGAGACGAT >R719_0_0_1_0_0_0_0_0_0_0_0_0_0_0 CTGGTAATATCTATGTAAATAGGAATATTGTTGGTGCTGTTNTTGGTGTC >R720_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GAAAACATCGAACATTCCGGAGCACCCCAACTCATGTCCAACCTCTTGCA >R721_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GTTTATCGCAGCTTCTCCCTATGCGGAAAAAATCCAGCAGCACGTGAAAG >R722_0_0_0_0_0_0_0_0_2_0_0_0_0_0 GGAGAATGAAAATTGGTTACAACTTTAAATGTAACAAGTGTGGCCATAAC >R723_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AGCTGTCAAAGCACCTACATAACCACCAATTGGACCAGCCACCATTGTAG >R724_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GCGGCTTGGGCGGGAAGGGCGCCGAAACCATGCGTCGGGACGTCGTCGGC >R725_1_0_0_0_0_0_0_0_0_0_0_0_0_1 TGCGAAGCCGACACAAGGGTTACACCATGGTGCCCAAAAATCGACGACGA >R726_0_0_0_0_0_1_0_0_0_0_0_0_0_0 ATAGAGCTTTTACACCATTCAGAAAAAAGAAAAGTATAAGTTTAAATGAA >R727_1_0_0_0_0_0_0_0_0_0_0_0_0_0 AGTTCCTGACCATGACCCGTGATTCAAATACGGGTAAAGGCCAGTACAAC >R728_0_0_0_0_0_0_2_0_0_0_0_0_0_0 ATGAAGAAAATGGCATTATCCTTCGCGGTCGTAAGTTTATTACTAGGAGC >R729_0_3_0_0_0_0_0_0_0_0_0_0_0_0 AATTTGAACGCAAACTTATACAGGAAAGGACTATGGCTGGTTTATCAGCT >R730_0_0_0_0_0_0_0_0_2_0_0_0_0_0 ATAGGCTTTTTAACAAATGGATACACCATGAGGTAAATCTCAAAACCGGT >R731_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GAAGATACCCCCCAACGCCACGAGGTCGGCCGGGTCCATGCCGGCCACGT >R732_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ACCCAAGTTCCTTACTGAACTGGAAAGTGTAAATTGGCATAAAGAAGACG >R733_0_0_0_0_0_1_2_0_0_0_0_0_0_0 AAGTGCATCATACACAGTTAAAAGTACATCATTTACATGGACACTCTGTT >R734_0_0_0_0_0_0_0_0_0_0_0_0_1_0 AAACGAACATTTTTTGAGTGGTCGTATCAGAGTGTAACGATTGAGAGGAG >R735_0_0_0_0_0_0_0_1_0_0_0_0_0_0 CTTATACGTTTTAATATTTATGTTTTTATTTAGTTTTATCGGTCCAATCT >R736_0_0_0_0_0_1_2_0_0_0_0_0_0_0 TCTTGTAGGGAAAGTGATGAAAATGTATCCAGTTGAATCAGCAATTGTAA >R737_0_0_0_0_0_0_0_0_0_0_2_0_0_0 CGACCGACAGCGACGACGTGTTGTAGTAGCCGACCGTAGCGCCGCCGACG >R738_0_0_0_0_0_1_0_0_0_0_0_0_0_0 
TTTAAATCAGCTGCATTATGCACATCTGATAAAAGAATGATAAATGCTGT >R739_0_0_0_0_0_0_0_0_0_0_0_0_1_1 CGCAGTACCGATTCTGCGACTTTGCCTTGGAAGGATTCAGAATGGGTATC >R740_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AATCCTCATCAATTGATTGAAGGTATAGCTATTGCTGGATATGTTGTTGG >R741_0_0_0_0_0_0_0_0_0_1_1_0_0_0 CGAAGGGCTCGGCGCCGACGAGGGGCTGTTGCCGCTCACGTGGGCGAAGT >R742_0_3_0_0_0_0_0_0_0_0_0_0_0_0 AGACTCACAACAGCAAGCGGAACAAGAATTACAATATATAAACGAACTTA >R743_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTGTAGAGTTACCTAAAGACTTATCAGATGGGAAATGGCATCACTTTAAA >R744_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GGGAAACCTTCTAAGCCATGATGCCCGCACGCGCCGCCTCTCGTCTCGAC >R745_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTTTGATGATTTGGATTTATTTTGTTGTATGCATCAATATGATCAACCTC >R746_0_0_0_1_0_0_0_0_0_0_0_0_0_0 GTCAGCTAATGACTTCATAATGTTCGTTGGAACAATATTTACAAATGTAT >R747_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GCGCGATTGGAATCACAAGAGAGTAAGGGGCGTAAGAAGTTATCTGGGTC >R748_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CATTGTTACGCTACTTGTTATAAAAGTCCATTTACAACGTAACAGTGTTA >R749_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GCGGGTTAATTCGGAATCCTTTTCGATGGGCGAAGCGAAGGCGTGGGCTC >R750_0_0_0_0_1_1_0_0_0_0_0_0_0_0 TTCACTTGATAAGGTAGTTCCGTTACGATAATAGATTGTTTGCCATTTGA >R751_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CAAGTTCTTTCACTGTAATTGCATTCATTAAATGATCTTGTGCATGCACT >R752_0_0_3_0_0_0_0_0_0_0_0_0_0_0 GGATGATAAATTTCTAGGAAATAGTATGGCTGATGTGATGTTGAATACTG >R753_0_0_0_0_0_0_0_0_0_0_0_1_0_0 ATGTTGATGACGCCGATGAGGCCGTACGTGATCGCGAGGCCGAGCGCGGC >R754_0_3_0_0_0_0_0_0_0_0_0_0_0_0 ATAACAATATTAAGTACTACAATCTTAAGTTTTATTATCGGCTTAATTGT >R755_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CATGCAAAACATGCCCGGCACGATCCACTGGCGCACCGACGGCGGCGGCT >R756_0_0_0_0_0_1_1_0_0_0_0_0_0_0 TAATTGGTATATGAGTTTTTATAGGGATGTGGGAAAGTAAGAAGTTACTA >R757_0_0_0_1_0_0_0_4_2_0_0_0_0_0 GATAACAAAAGTGGACCCTGAATTAAGCTCGAAAGCAAAAGTGATAGGAT >R758_2_0_0_0_0_0_0_0_0_0_0_0_0_3 TAATTATATTATATATTTCATTTAAATTACTTTTTTCGATCTCCATAGCA >R759_0_0_0_0_0_0_0_0_0_0_0_0_0_2 AACCAAGGAATTTTATGTTTCTGCTTGCGATATATATCTCTGTCGCGATT >R760_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GCAGTTGATCGGCGACGCGCGCGAGTGGACGAGCTGCTGGACGATGGGGC >R761_0_0_0_0_0_0_0_0_0_0_0_1_0_0 
GATGTCGACGATCATCGACAGCACGGTCGGATGCAGATGGAAATGCTTGT >R762_0_0_0_1_0_0_0_0_1_0_0_0_0_0 AAGTCGATTACTTCATCAACTACTTCATCAGGACGAGCGAAGTCACGGTC >R763_1_0_0_0_0_0_0_0_0_0_0_0_0_0 ATGGCCAGACTTGAGCAGTCTAAATGTAATGCCACCTCAAACTCCTGAGC >R764_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ACAAACAAATGATGTAAACATAATGAACGATAATAAAGCTGCATTACTAA >R765_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TAACCAGACGATCAATACCAATACCTTGACCCGCTGTTGGCGGTAAGCCG >R766_0_0_0_0_0_0_0_0_1_0_0_0_0_0 TAGCGGTTGCGATTTCAGAAAGTGCAATTGGTGCTAACGGCTTAGGTGCT >R767_0_0_0_0_1_0_0_2_0_0_0_0_0_0 TTATCCCAGCAGCGGGATTAGGCACAAGATTTTTACCCGCAACAAAAGCA >R768_2_0_0_0_0_0_0_0_0_0_0_0_1_1 TGAGATCTACATGTACAACATCGGTCTTACCTTTGAAAACATTAACTTGA >R769_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GTGCGCAGATGGACGCGCTCAACATCGCCGACAAGCCCGAGGATTTCATC >R770_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCGAAGATGAAGGTCGGCCCGGGCACGGGCGAGCAGGTCGACATGGGGCC >R771_1_0_0_0_0_0_0_0_0_0_0_0_0_0 ACATCAACCTGCAAATCTCACATTAGCGCAAATACAACAGATGATAGGAG >R772_0_0_3_0_0_0_0_0_0_0_0_0_0_0 CTCCAAATAAAGAAACGCTTATATTAAAACTTATTCCAAAACCAGTATTT >R773_0_0_0_0_0_0_0_0_0_0_2_0_0_0 GGAAAGCGCCGCTCGCATGCGGCGACGACGCGCGGCATCAGCCGGCACGC >R774_0_0_0_0_0_0_1_0_0_0_0_0_0_0 CTTCAAAAATAACAGTTCCATCTGCCTTCGCATAACCTCTTTCAAAATCT >R775_0_0_0_0_0_0_0_0_0_0_0_0_0_1 ATAGGATGCGCCGGAAAAGAAAATGGAGGCAGTGGAAGGTCTGTATAATG >R776_0_0_0_2_0_0_0_0_0_0_0_0_0_0 AAAACGCATTATTTCAAGCTACATATACATTTCAATATAACGGAGTATCA >R777_0_0_0_0_0_1_0_0_0_0_0_0_0_0 CATCCTTACTTTTAGATAGTAACGTCAATTTATACGCTTTAACCAGAGAT >R778_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CTCGAAAGTTCGTATGCCGTCTTCTTCTTTAAGGAGAATTGTTGGAAATT >R779_0_0_0_1_0_0_0_1_0_0_0_0_0_0 AGAAAAAAACCTATCGCTAGGAGAAGCTATCGTACAATCTGGACACCAAG >R780_2_0_0_0_0_0_0_0_0_0_0_0_0_0 TCAGGAAACACTAAGCGCCTCTCGTCAACTTGATGAAAGCTTGCAGCAGA >R781_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTAATATATGCTCCTGTTACCGCATCCACTTTTTTCGTAATTAATGCTGG >R782_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CGGCGGCCGAGCGGCTCGTCGCCGATTACGCGGGTGCGTACGTGCTGGAG >R783_0_0_0_0_2_0_0_2_0_0_0_0_0_0 ACTTTACCATTCGTGGAAGTTTTAGTTTGTTTTTAGGGATATATGGAACG >R784_0_0_0_0_0_0_0_0_0_1_0_0_0_0 
CAAGGTCTTGCGGATTGCGCCGTCGGGCTACCGACGCCATGCTGCGCAGT >R785_0_0_0_0_0_0_0_0_1_0_0_0_0_0 AATGTCATATTAAAAGAAGCAAAAAGGCAATTTCCAAGAGAGGGATTTTC >R786_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GTTATAAAACCTTTTTTGATTACTCGGTTGCCAAAAAAGAGAAGATGACC >R787_0_1_0_0_0_0_0_0_0_0_0_0_0_0 GAAATGGATTGTAAATCAACTTGAGGATGAGTCATATAATGGTCTTGAGT >R788_0_2_0_0_0_0_0_0_0_0_0_0_0_0 GATGTTGCATTAAATAGCTTGCAAATACTAGGTGTTAAGCCAGATAAGAT >R789_0_0_0_0_1_0_0_0_0_0_0_0_0_0 AAAGAGCCTTCATCGCAAGAAGAGATGTTAATCAAACAGTTAGAGGAAAT >R790_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ATAATACAATAAATATTGCTGAATTTAATTTAGGAGAACGTTTCCTTTTT >R791_0_0_0_2_0_0_0_1_2_0_0_0_0_0 AATTATTTTAATTTAAGCTATGTATTTTATTGCTTAAAATTAAGGAAGGA >R792_0_0_0_0_0_0_0_0_0_0_0_0_0_2 TCATGGATCGTGGCCGATTTGGAAGGCGATAATCCCGATCAGCAAGAGAA >R793_0_0_0_0_0_0_1_0_0_0_0_0_0_0 TTATAAAAATCGTATTCAATCATTTCTCTTTTTTTCACATTTGCTTCATT >R794_0_0_0_1_0_0_0_0_1_0_0_0_0_0 CACAATTAACACAGACTGCAGTCATTGGACAAATCAATACATTACTTGAT >R795_0_1_2_0_0_0_0_0_0_0_0_0_0_0 ACTATTTTATAGGTGGTTTCTTCTTCAGTATCAACATTCATAATTGTAAC >R796_0_0_0_0_0_0_0_0_0_0_0_0_1_0 AGGCGGCAAGTGAGTGACAAATTTGTCGGGAACAAATTTGCACAGCCGAA >R797_0_0_0_1_0_0_0_0_0_0_0_0_0_0 GCTCGCGTCCCATCGGATGCCCTAAATACCCCTAGTAAGGAACAAGAACA >R798_0_0_0_0_0_0_0_0_1_0_0_0_0_0 ATTGATGTGATTTGGTTATCGCCAGTTTATGAATCTCCAAATGATGATAA >R799_0_0_0_1_0_1_1_0_0_0_0_0_0_0 GATTTCATGTCTCTACTCCAAGGAATTTTAACTCGACTTGTTAGTCTACA >R800_1_0_0_0_0_0_0_0_0_0_0_0_0_0 ACGCTGAGTACGAGCCGATAATGCGCGCACTTCATCCGCCACAACGGCGA >R801_0_0_0_0_0_3_0_0_0_0_0_0_0_0 ATTGCTGTTTCTAAATTGCTCAAAATTAAAAAATATATTAATGCATTNNN >R802_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GCCAGGGAGATGCGAGCAAGCTGCGCGCGAGTAGAGAGATTAGATAAGAT >R803_1_0_0_0_0_0_0_0_0_0_0_0_0_0 CGCGAGCGTAGCTGGCCAAAGCGATGCCACCCAGACTTAACGGAACATGG >R804_0_0_0_0_0_0_0_0_0_0_0_0_1_0 GGCAGCTTTTTATCGGCTTTGTAGCCAAACTCATTGAGCAGCGCTTGGAC >R805_0_0_0_0_0_0_0_0_0_0_1_0_0_0 AACTGGGACCCGGTCGACCAGACCGTGCTCGCGAACGAGCAGGTGATCGA >R806_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TCAGTGCGGTTTTTACTTCAGTGATGTAAACCGTCCCCACAAACACGTTG >R807_0_0_0_0_0_1_1_0_0_0_0_0_0_0 
TAATCCGTGTTTTATTAAAATTACTTCATTCACACTAAACCCGTACTCTT >R808_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TGAGCAAGCTTGGCCACCTCTTGTTTGAGATAAGTCAGATTACGACTTAT >R809_0_0_0_0_0_0_0_0_0_0_0_1_0_0 ACGCGGCATCAGATACTCCTGTTCTCCTGCCACCCGGAGAAATGGCGCGA >R810_0_0_0_1_0_0_0_1_0_0_0_0_0_0 ATTGTTGATTTAGAAATAGAATAGAAAGAAGCAGCATCTATTTGGATGCT >R811_0_0_0_0_0_0_0_0_0_1_0_0_0_0 AACGCGCTCGGCGAAGGCGCGACGTGGTGCGACGCCGCGCACGCGCTGTA >R812_0_0_0_0_1_0_0_0_0_0_0_0_0_0 AAAGATACGAACGGAGATGGATTCCGTGAAGATCCGAATGGTAAAGAATT >R813_0_1_0_0_0_0_0_0_0_0_0_0_0_0 CTTCAAGTTGGTGGTGTAAATCTCTTGGACATAGGCACCCATACATAATA >R814_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TCCACGAACGCGCCTAAATAATATGATAATGCCTCTATATGATTGTTCAT >R815_0_0_2_0_0_0_0_0_0_0_0_0_0_0 AGATAATAATGTAATATTTTCTCAAGCAATGCTTAATACCCAGCAACAAA >R816_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TAGTTGATTCTGTAACGATTCCACATATGTTGCATGAATCCACTACGACG >R817_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TTGATAATTTTTGCTTCATATGATATACCAAAATTTTTAACACTCATAGC >R818_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TCTACGTCGTGAAGTTTCCATGAACATCAAGCGCCTAATGGATCTTGGTT >R819_0_0_0_0_0_0_0_5_4_0_0_0_0_0 CGTTCCCCTGCTATATCTGAATAAGGGTTACCTATATCAAGTTTGGGACC >R820_0_0_0_1_0_0_0_1_1_0_0_0_0_0 CTACAAGAATATTTTATATTCTTGATTTTTCTAATTTAAACGGTCTATAT >R821_0_0_0_0_0_0_0_0_0_0_0_0_0_2 CTGAAACACAACAATATTCTCAGGGCGGGGCGAAATTCCCCACCGGTGGT >R822_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GCTGTTCGACCGGCTGGCGTCGTGCGCCGCGCGTCGCACGCTCGCCGGCC >R823_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTACGAATATTTCCTGTCTCTAAATATTCACGTAATTGACGCGCCGCCAT >R824_0_2_1_0_0_0_0_0_0_0_0_0_0_0 AACAACATTTGGATATGGTGCAAATTGCTGTTGATATGTTCTTAGGATAC >R825_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGCTGGCGAGATACCAGTCGGCGCGGGAGCCGTCCTTCACCGAAAACGCG >R826_0_1_1_0_0_0_0_0_0_0_0_0_0_0 TCTTATCAATAGTTTGCTTATAGCTATCAGAATTAAAAATAGCTGAACCA >R827_0_1_0_0_0_0_0_0_0_0_0_0_0_0 CAAGCTTTTGATAAGTATCATAGAGATTTTGCCACTGTTTTAATGCTAAA >R828_0_0_0_0_0_0_0_0_0_0_0_0_0_2 ATCAATAATCCATACCTTCTCTTGGTCATCAATCAAGATGTTATGAATAT >R829_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GCGTACGCCCGCGCGCGCGGCGGACCGCGCCGAAATGCGCCGACGTTCCC >R830_0_0_0_0_0_0_0_0_0_0_1_0_0_0 
GGCGCTGTTCTTCAAGGCGAACGTGCTGGCGTCGACATTCCGCCCGCACC >R831_1_0_0_0_0_0_0_0_0_0_0_0_0_2 CATCGAAGGGACAGGGCGAATTTCGTCGCGATTCACGCCGAGCTTACCCA >R832_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TTCATACTCAAACCAAACAAAAGGTAATACTGGAACGCTTGCTGGAATAA >R833_0_1_0_0_0_0_0_0_0_0_0_0_0_0 ACCTAAAACCATATCATGCTGAGCTTGATGAAGATTCAATCTAGAGGTTG >R834_0_1_1_0_0_0_0_0_0_0_0_0_0_0 AAATAAGTTTAATCAAACATGTTACTAAAATAATTGCTAAGCCCCAGTTA >R835_0_0_0_0_0_1_1_2_0_0_0_0_0_0 AACATGATCACTGGTGCTGCTCAAATGGACGGCGGTATCTTAGTAGTATC >R836_1_0_0_0_0_0_0_0_0_0_0_0_1_0 ACAAGGCATCACAGGTTTACACTACAATCCGTTTACCGATACCTATCGTT >R837_1_0_0_0_0_0_0_0_0_0_0_0_1_0 AAGATCGAGCCAGAAGTCCATGTTTCCTCCAAAGTGTTGAAGACGAGTTA >R838_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCTCGACGCCGGACTCGTTCGGCGCGTTCGAGCAGGGCGCGCAGGAGGTG >R839_0_1_0_0_0_0_0_0_0_0_0_0_0_0 GGAAAGAACCAAAACGGATTTCGTAATTATCAGCCGCACTGNCTGCTGAA >R840_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CAGGGCTCAACGCCATGAGTCGAGAGTTGGGCCTCCTTCGACTGCGCGGT >R841_0_0_0_1_0_0_0_0_0_0_0_0_0_0 CAACAGCCATTTTCGTTTCTAAACGATGCTTATTCGTTTGGATGAAGTTC >R842_0_0_0_0_0_1_0_0_2_0_0_0_0_0 ATTCACTGTAAAATGGCAAGCGAAAATCGAGAAGCTATGGATACAGTGGA >R843_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TATATTGCTGAACCAGTTCCAACATTTGTAGAAAACTATTTATCAGAACA >R844_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AACTGTAGTTTATTTAAATATGGCGCAGGAAGCTCACTAAGTTTAAACTA >R845_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGCTTTCGATGGAGCCGCCGAGCTGCTGCGGCAACGACGGCACGGCGGGG >R846_0_0_0_1_1_0_0_0_0_0_0_0_0_0 GCAAACCTAGAGAAACGTGTAGAATCAATGGGTATGCAAGATAAAATTTT >R847_0_1_1_0_0_0_0_0_0_0_0_0_0_0 AATTCATTATCTCCGAGTATATCAAGGGTGTAGAATATGCTGTTGGAACA >R848_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TGGTGGTGGACCAGTAGCCGGCGGAGATGAATTGTTTAAAAAGGTAATGG >R849_0_0_0_0_0_0_0_0_0_0_0_0_1_0 CAGGTGCATGGCAATGGGAACCTGTCAACATCAAAGAGGAAGATAAACCG >R850_0_0_0_0_0_0_0_0_0_0_0_2_0_0 ACGCTCAACCCGACCGGGGAAGCAATCAATGTCGTCGAATACTTGAAGCA >R851_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TCCCTTCACACTAAAATACGGCATTAATATATAATTTAAAGCTAACTTTA >R852_0_0_0_0_0_0_0_0_0_0_0_2_0_0 TTCGGGCACCTCGACCTTCTTGCCGTCTATTTCAAGTTCAACCATGATGG >R853_0_0_0_0_0_0_1_0_0_0_0_0_0_0 
GAAGTATTTACATGCATTAATCTCCTATGTTTCTCAGTTAAATTATATAC >R854_0_0_0_0_0_0_0_0_0_1_0_0_0_0 GTGCATCGGCATGCATTCGAATCATTAATCGATTCTTCGAATGAATTTGC >R855_0_0_0_0_0_0_0_0_0_0_3_0_0_0 GGACTGGCGCGGCAGCGCCGCGGCGCGCACGGCGCCGGCGTCGCGCGGGC >R856_0_1_0_0_0_0_0_0_0_0_0_0_0_0 CTTTCTTTATATACATGACTATCAGAAGGTATATGGTTTAGAGTATTTGA >R857_0_0_0_0_0_0_1_0_0_0_0_0_0_0 TGGCTGTACACTATCAATTTTATTCGGCAACGTATGTTGAGGCTCCCAAT >R858_0_0_1_0_0_0_0_0_0_0_0_0_0_0 ACCTTTTAAGGTTGAAAAAACTTTGAAAAACCATGCAACCCAAGGATTTG >R859_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TTAATACCGCAAGAACCACTCATTTTTCCGCATATGACTATTGAAGAAAA >R860_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGACTGGCTCAAGCACATGAAGGCGCTCGGCAAGAAGCTCGTCGTGTGCT >R861_0_0_0_0_1_0_1_0_0_0_0_0_0_0 AGGTGAAGGATTGAATGCAAATTACTTAGCAGATTATTTAGAAGCGAAGT >R862_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ATTTGATAACTGAAAGCANTCGCTTCAACTACAATTGGATCATTGATATC >R863_0_0_0_0_0_0_0_0_0_1_1_0_0_0 TGCCCGTGGCGGCGCGTGCCCGTGTGCCCGCGCGTTCGCCGCGGCGGGGG >R864_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TGGTGGACGACATTCTCGACGTCACCACCGATTCCGCGACGCTCGGCAAG >R865_0_0_0_0_0_0_0_0_0_0_0_0_0_2 TTAATGCAGAAAGAGTTCGAATCATGCCGCCAATGCTTGCAGGAGCCGAG >R866_0_0_0_0_0_0_0_0_0_1_1_0_0_0 GCTGCGGCGCGACTTCGTCACGTGCAGCAGCTCGAGCAGCCACGCGACGC >R867_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TTGCTTTCGCCGCCTTCCTTGCCGTCGGCGCCGTAGCTGAACACGTCGAT >R868_0_0_0_0_0_0_0_0_0_0_0_1_0_0 TCGTCGCACGTCCCGACGACGACGTGACGCACGAGCGGCTTGCCGATCCC >R869_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTATTGCAATATCCAATCCATTAAATCTTGTTTTTTGGTTTGGTATATAT >R870_1_0_0_0_0_0_0_0_0_0_0_0_0_0 ATAGGGATAATTACATGGGGAAAGCAATGAACAAAATGGCTATAGCCCTC >R871_1_0_0_0_0_0_0_0_0_0_0_0_0_0 GCGTTGGTGCCGCCTTTAGCACTACTCTGGATGGATCACGCAGAAAAAAG >R872_1_0_0_0_0_0_0_0_0_0_0_0_0_0 GATTAGTTAAAGTTATCGAAGGACGGATTAGTTACTAAACAGGTGAATGG >R873_0_0_2_0_0_0_0_0_0_0_0_0_0_0 TAATGTGAACTAACCATAATTCTACTACCAGCAAATACCACTATGAGCAA >R874_0_0_0_0_0_0_0_1_1_0_0_0_0_0 AAGATGCTGATATGGCAAAAGAAATGTCTGAAATGACTAAATTCAAAATC >R875_0_0_0_0_0_1_1_0_0_0_0_0_0_0 CATGAAAGCAATGGGTGCTTTAGCTAATGCAGCAATCGCAAGTTTTCTTA >R876_0_0_0_0_0_0_0_0_0_0_0_0_0_1 
ATACATTTTTCTTCCTGATCTCAGGAGCGCTCGTCATGTGGATGGCAGCA >R877_0_1_0_0_0_0_0_0_0_0_0_0_0_0 ACTAGAGGGTGGTGATGAGGATCTTGCTAAAGATGTTGCTAAGCATGTTG >R878_0_0_0_0_1_0_0_0_0_0_0_0_0_0 GACTGGTGAAGAATGGATTGCCACTATACCGATTGGTTATGCGGATGGCT >R879_0_0_0_0_0_0_1_0_0_0_0_0_0_0 TCTTCTGCTTGAAAAAAACAACACAATACGAAAAATAATCGCTGTCATCA >R880_0_0_0_0_0_0_0_0_0_0_0_2_0_0 TAAGGGTTTATTGTCGGATGACAAGCCGCTTGGGACACGGCGACAATACC >R881_1_0_0_0_0_0_0_0_0_0_0_0_0_1 TATCACAAGCCAGTTTTGTGCTCTCCTTTATGCTCGTAACCAGTATGTTT >R882_0_0_0_0_0_0_1_1_0_0_0_0_0_0 TTTTTGAACAAATGGAGGGTAAATAAATGACTTGTTATGAAATGGGATCC >R883_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TAAGCGATGGAAGAGCTCGGCCAGAACCTGAGCGACTTGCTGGAAGAAGA >R884_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TCCTAAATAAAACTAGAAGGGTAATATGCATTATTAGAACAATTATTAAT >R885_0_0_0_1_0_0_0_0_0_0_0_0_0_0 CTGAAGTATATGCTTGCTGTACACACCCAGTATTATCTGGTCCAGCAATT >R886_0_0_0_0_0_1_0_0_0_0_0_0_0_0 GCCATCTCATGAATTCGTTGCAAAATTTGTTGGTAAGGCAAATTGGCTTG >R887_0_0_1_0_0_0_0_0_0_0_0_0_0_0 GGCAATAGTAACTCCTTGCATCTTACATCCAAGGCTATTGCTGACATTTA >R888_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TTGTTTGTAAAGCACCCGATTAAAATTGATATTGCAGGGACGATCGAGTC >R889_1_0_0_0_0_0_0_0_0_0_0_0_0_0 GGCATTCCTGCTGGTAGGGCCAAGCGGTGTAGGTAAAACCGACACCGTAG >R890_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TTATTTTTCATTTCAGAAAGACGACGTTCTAACTCATCGATTTGCTCTAC >R891_0_0_0_0_0_1_1_0_0_0_0_0_0_0 CACTTTGCGCAGCCGCCTCACGATAAGCATCTACTGATCCTTTAAAGTTA >R892_0_0_0_1_0_2_0_1_0_0_0_0_0_0 TTAAAGGTTTTACAAGGAAAAGAAACTTCCACTCCAGCTGGAGCTGTTAC >R893_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CGAGCAGGCCGTGCTGTGCGGCGGCACCGTCGAGCTGATCAAGGCCGGTT >R894_0_0_0_0_0_1_1_1_0_0_0_0_0_0 GCTAGGAGAGAAAGATGTTCTGGCTAGGCTGGGTGGCGACGAATTTGTGT >R895_0_0_0_0_0_0_0_0_0_0_1_0_0_0 CGGATGTCGACCACGAGCTTTCCGCGGCCGATGCGTGGCGGATCGCGCGG >R896_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CACCTCGTCGAACGACAGGCCGGCGAAGTGCGCGTTGATGTAGTTCGACG >R897_0_1_0_0_0_0_0_0_0_0_0_0_0_0 ATATGCTCAAAAGCATTATTTATCGCTGTAACATGTCTTTCACGTGCAGT >R898_0_0_0_0_0_0_0_0_0_0_2_0_0_0 AGCCACTCGCCGTTCATCGCGCACGCGGGCGCGGTAGCCGATACGCTCGC >R899_0_0_0_0_0_0_0_0_0_0_0_0_1_0 
AAGCCTTTTGGCGGCTTATTACGACCGCGAGTTTCTACGCGCACTCGAAC >R900_0_0_0_0_0_0_0_0_0_0_0_0_1_0 CTGATACATCATACAAATAGCAGCCCGCTGCACTGGCCAATGGAGCGAGG >R901_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TACTTATAGTAATGTCAACTTTCGCGGTGTTGCTAATGGTAATGCTAAGG >R902_0_0_0_0_0_0_0_0_0_2_0_0_0_0 CAAGCGGCGACGTGGAATCGATCTCGAAGGAAATCTTGCTGTCGGCCCCC >R903_0_0_0_0_0_0_0_0_0_0_0_1_0_0 CCGCGAGAGGTGTTCAAGCTCTATACGAGCGCCGAAGTCCACACAAAAAA >R904_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TAAACCGTACCTACCGATGCGGTTTCCAATAAAGTTTGGTGTGTCTTTTG >R905_0_1_0_0_0_0_0_0_0_0_0_0_0_0 GCTTTTGTAATTTTAGGATTTATAAACACCTGATATGGTACACTATCAAA >R906_0_1_0_0_0_0_0_0_0_0_0_0_0_0 TATTCTTGGTAAGCATGTTTTGAGCATTAGTAAGTCATTTTNTATGACCC >R907_0_0_0_2_0_1_1_0_0_0_0_0_0_0 AGATCAAGTGAAGATACAAGGGCGTAAAGAAGAGCTAGAAAAGATTTTAG >R908_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TTTGATTTTTCGGAAGAAAGGATAGAAAGTACTGCAAGTGTTATTTTGGA >R909_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TTTTTACAAAATGATCGGCAGCCAAGACTAGCAATACGGGGTCATCCTCC >R910_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TGTACCACATTTATTATTTACTTTATGTCCATTTTGTCTAAAATAGAAAA >R911_0_0_0_0_0_1_1_0_0_0_0_0_0_0 TTTATTTATAAAACTCAACACTTCCAACATTTAAAATATTTTATTGTTAT >R912_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TAGAACTCGAATATTGGGTATTTTCTTGTTTACAAGCTGCTTCAGCAGGG >R913_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TTAACGGGAAAATCTTTTTATTCACTGCTCGCAATGACAATAACAAAGAT >R914_0_0_0_0_0_0_0_0_0_2_0_0_0_0 TGTCGTCGGCCGACACGCCGATCACCGTCGCACCGTACCGTTTGTAAGCG >R915_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CGAGAAGCACAAGGTGCTCACCTATCCGCGTACCGACGCGCGCGCGCTGC >R916_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TCATGTAAAGTAAGTGAAGTACAAGATTTAATTGCAGTATATCAAAAACT >R917_0_0_0_0_1_0_0_0_0_0_0_0_0_0 GTAAGGTGGAAAAAGATAAAGATGCTTTTGATTTAGTGAAGGCTGTGTTC >R918_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TGAAACAGTTCACCGCGCTGCTCACGCCAGTCGCACCATTGCCAATCTTG >R919_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCGAGCATGCCGACGATCGTGCTGCCGGCGGCCTTCACCGTGTCCGCGCC >R920_0_0_0_0_0_0_0_1_0_0_0_0_0_0 AATCCTTTATTGAAGGAGAAAAGGCCATGATGCAGCCATTAAAGATGGAA >R921_0_0_0_0_0_0_1_0_0_0_0_0_0_0 ATTAAATTTGGACATGGAACTGAATCTCAACCTATTAACCTTGGACATCT >R922_0_0_0_0_0_0_0_0_0_1_0_0_0_0 
CGAAGCCGTATAGCAGCGCGAAAACGGTTTCGAACACGATCAACTGGCCC >R923_0_2_2_0_0_0_0_0_0_0_0_0_0_0 AGGAAAGATAGATCTGAAGAAATACATTGGAATTTTAGAGAATCAATATG >R924_0_0_0_0_0_0_0_0_1_0_0_0_0_0 ACGTAAAAATGCGTCAAATCGCAAAAGATAAAGGCGAGAAAATTAGTGAG >R925_3_0_0_0_0_0_0_0_0_0_0_0_2_0 AAAGTGGGCACAATCACTGACGCTCAAATCCAAGAAATCGCTGCGACTAA >R926_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CATGTGGTTACTTTCCGGACAAATGCCGACGTTGTACGTGACGGGCGAAG >R927_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GGCGGTGCGGCGCGCGTTGAGGATCGCTTGCGTGAGCACGCCCGCCACGA >R928_0_0_0_0_0_0_2_0_0_0_0_0_0_0 GGATTATGGTTACAGCAGCATGTTTAACGACTAGTGTAGGACTTGTTTCA >R929_0_0_0_0_0_0_0_0_0_0_0_0_0_2 CATCAGCAGCCCATTGCCTGTTCCGCCATTTCTGGAGCTGTCGCTCAGTG >R930_0_0_0_0_0_0_0_0_0_0_0_0_1_1 AATGATTACGCCTACAGCGTAACCGCCAGTGTCGAAATTTGCCGTTTTGA >R931_0_0_0_0_0_0_1_0_0_0_0_0_0_0 TCATTCGGGCGCAAGTCTTATCTTTAAAGCAAAGAGAATTTGTTATTGCA >R932_0_0_0_0_0_0_0_0_1_0_0_0_0_0 TTAGTTCTGAAATAGCAATAAACATTGTCGTTGTAATAGCGAACGGGATC >R933_0_0_0_0_0_0_0_0_0_0_0_0_0_1 CACTACGGTGCGAGTGGTCGCTCGGCTGATCCCGTCTGAAGTCGGGATCG >R934_0_0_0_0_0_0_1_0_0_0_0_0_0_0 AGAAGTACAAAAACGATCGAAAGAACGATTTAATATTTATATTGATAAAG >R935_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CGCAATTTGTTCGTGTTCTTGAAGATGATGTGAAAAAGGAATCAGCAAGC >R936_0_0_0_1_0_0_0_0_0_0_0_0_0_0 ACAGCTAGTCAAGAAGAACAGTTTGTAAAACCTCTACTAACAACGAAGCG >R937_1_0_0_0_0_0_0_0_0_0_0_0_1_2 AAAGCAAAAATGTTACAAAATTTATCCAAATGAATAACTTCTAACCTGAA >R938_3_0_0_0_0_0_0_0_0_0_0_0_0_1 ATTCTAGGCAAAAAGATTACATACCGGTTAGTGATGTTAACAATAAAGTA >R939_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GCGCGCGGCCGCCTTGCGCGCGCGCGCCTTCGCGTTCGCCTGCGGCCGCG >R940_0_1_0_0_0_0_0_0_0_0_0_0_0_0 AAACACATGGACTATATACAGTATCATCAAGTCAATCGGCANTTTTGACT >R941_0_0_0_0_1_0_0_0_0_0_0_0_0_0 ATGCAATGTTACTTCTTTTGGCGTAGCGGCGAAAGTAGGGAAGACGGTTG >R942_0_0_0_0_0_0_2_0_0_0_0_0_0_0 CATATCAGCATCTTCTGCAATGACAACTTCTTTAACTATACCATTTTTGA >R943_0_0_0_0_0_0_1_0_0_0_0_0_0_0 GAATTTCGCTTCGGATATTAGTTCTATGGCTGCGGAAGGATGTTACTTCG >R944_0_0_0_0_0_0_0_0_1_0_0_0_0_0 AGGATGTTCCATTTGATCGTCTCCTTTATCATGTAATAGATTTTGTGTCC >R945_0_0_0_1_0_0_0_0_0_0_0_0_0_0 
CGTTTCAAATCCAGTTAAAACTGTGGCACCTTTAACTGTTGATCCCAACT >R946_0_0_0_0_0_0_1_0_0_0_0_0_0_0 GACCATTATTTTTAAACTGTAATATACCTTGATCTTGATCATACCAATAT >R947_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GACGTCGCGCTCGCGACCGATACGCGGCTGATGCCGGCGATGCGAAAGCC >R948_0_0_0_1_0_0_0_1_0_0_0_0_0_0 GTAAGCACTACACCTATTCATTCTATTCAAAAACAAGAACAAGAGCCGTT >R949_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TGTGGGTATGAAGTTGTAGGAATTAATTATATTGGAGACTGGGGAACACA >R950_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CCGAGTACGAGTAGTGGTAATAGCCGCCGCCGTTCGCGCCGGACCCCATC >R951_0_0_0_0_0_0_0_0_0_0_2_0_0_0 GTGCAGCGTGCGGACCGTCAGGCCGCAGCGTTTCGCCAGTTCTCCGATCT >R952_0_0_0_0_0_0_0_1_0_0_0_0_0_0 CATATCAGCATCTTCTGCAATGACAACTTCTTTAACTATACCATTTTTGN >R953_0_0_0_0_0_0_0_1_0_0_0_0_0_0 TGTAGGTGGTTTAAATTCGTATATTACGTATACATCACCTGAAATGATTG >R954_0_0_0_1_0_0_0_0_0_0_0_0_0_0 GGACATGACGTATATCGCAGCGATTAAAGCAGGCTTTGCCGTAATTCCGA >R955_0_0_0_0_2_0_0_0_0_0_0_0_0_0 AGATGTAGCAATGCGCGCCATTATAAATCCTGATGATGAGGTACTTATTA >R956_0_0_1_0_0_0_0_0_0_0_0_0_0_0 AACTTTTTGATGGTAAATATTCTTATAGTTAGAAGTATTATATTGTTATA >R957_0_0_0_0_0_0_1_0_0_0_0_0_0_0 AGCAATTATACGAACATAAATGAAGATGTCTTTTTATTACCTGTAGAAAA >R958_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TTTCCATCGGCATAGGCCGCATTCAAGGCGGTCTGGATGGCTTCCCGCTC >R959_0_1_1_0_0_0_0_0_0_0_0_0_0_0 AACAATAAGATATGAAAGATTATCAAAGTTTAACAGAACAAATCAATAAT >R960_0_0_0_0_0_3_0_0_0_0_0_0_0_0 CTACTTTAAATGCCCTCCTTTTCTTTCCCCCCACTTCGCAACCGGACTGG >R961_4_0_0_0_0_0_0_0_0_0_0_0_1_0 AGCTCTGTCTCAAGATGGTCAATTGGTGCTATCTAAAGATCATGTTTTGT >R962_0_0_0_0_0_1_0_0_0_0_0_0_0_0 ATGGCTATATCTACAGGTAAACCGGTAGCTAATTCAATTCCTGTTGAGGC >R963_0_0_0_0_0_1_0_0_0_0_0_0_0_0 ATCTTCGGATAATACCCCTAACATATCACCCGTTTGGAATCGNNNNNNNN >R964_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CCGCGGCGCGGGCGGCATCGGCCGGAAGATCGCGGTAGAGGCAGCAGAAG >R965_0_0_0_0_0_0_0_0_0_0_0_0_1_0 AAACCCTTAGCTCAACAAAGTGGTTTGCTACTGATGAACCCGCCATATCC >R966_0_0_0_0_1_0_0_0_0_0_0_0_0_0 ATTTCTTTTTTGTTTTATTGTTCTGTCCGGTCCACATGTAATAGAAACAT >R967_0_0_0_0_0_0_0_0_0_0_0_1_0_0 TCGACGCTTCGCTTGATAGAACAGTTTGTCTTTCTATTTTTTAAAAACCA >R968_0_0_0_0_0_0_0_0_0_1_0_0_0_0 
GGAAACCGTACACGCGTTCGGCGCGATGGAGAAGCCGCCAACCGCGCTCG >R969_0_0_0_0_0_0_0_1_0_0_0_0_0_0 AACCCCCTCATCAGGCTTATCTAGAGCACCAAGAATGTTTAATAATGTAC >R970_0_0_0_0_1_0_0_0_0_0_0_0_0_0 CAGAAGACCATTCGTATGATGGGAAAAGTCCGTATTACAATAGTTGTGAC >R971_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GTGCACGGGAACATCTGGGAGCGCGCAGCGAAAGCCCGCGACGGCTAAGC >R972_0_1_0_0_0_0_0_0_0_0_0_0_0_0 ATATCTTCTGCTAAAGACTCTCTAACTAGCCTTGTAACAATATCATTGGG >R973_0_0_0_0_0_0_0_0_0_1_0_0_0_0 TGGATGAGATCGAGCTCGAGATTGGCGACGCGCAGCACCGGCGCATCGGT >R974_0_0_0_0_0_0_0_0_0_0_0_0_1_0 TTGAGTTGACCGAAATTGAATTAAACCGCGCCAGAATCATTATGATTGAT >R975_0_0_0_0_1_0_0_0_0_0_0_0_0_0 ATCTACATGTGGATAGACTGGGCGTAAAACAAGGAAAGTTATTCACACTA >R976_0_0_0_0_0_0_0_0_0_0_0_1_0_0 ACGGCTCGTCCATCAGCAGCACGCCCGGCTCCATCCCCCGGTCGCGCGCG >R977_0_0_1_0_0_0_0_0_0_0_0_0_0_0 TATAATAACTTTTACTCCAATATCCGGCAAAAGTCATAATAATTCCCCAA >R978_0_0_0_0_0_0_0_0_1_0_0_0_0_0 TTAGACGGGAAGTGAAAGTGTGAAACATGTTTTGAAAAATGATTGGGGGC >R979_0_0_0_0_0_0_0_0_0_0_1_0_0_0 TCTGGAGCCGCGCGCCCGACTACCGCGTGCTGTACAGCAACCTGTCTGAC >R980_0_0_0_0_0_1_0_0_0_0_0_0_0_0 CATTATGGAATAGCAGAATCTTTGTTGGAAAATATTCAGGATCCAATCGA >R981_0_0_0_1_0_0_0_0_0_0_0_0_0_0 TAATCCAGCCTCTGTTAACTGCTCTGCCACAAATATAGAAGACCCTTCTT >R982_0_0_0_0_0_1_0_0_0_0_0_0_0_0 TTTTGCAATTGCTAATCCGAGACCAGATCCACCAGTGTTCGTAGAGCGNN >R983_1_0_0_0_0_0_0_0_0_0_0_0_0_0 TCTGCACCATCTCGATTACATCATGGATAAAGTCGATTTGCTTTTGCTGA >R984_0_0_0_0_0_0_0_0_0_0_0_0_0_2 CACCATGCTGGCAGGCTCGTCTAAGTTAGAGAGGAAGTTGGCAATGCCAC >R985_0_0_1_0_0_0_0_0_0_0_0_0_0_0 ACCAGCTGGCGCTGAAATAACTACTTTTTTAGCACCTGCATGAATATGAG >R986_0_0_0_2_0_0_0_0_0_0_0_0_0_0 AATATAATTTACTCGGAGGAATACCTATGGCAAATAACAATCCTTGGTTA >R987_0_0_0_0_0_0_0_0_0_0_2_0_0_0 GGCCGCGACATCGCGCGGCAGCGCACCCGCACCGATCCGGGTGCGCATCC >R988_0_0_0_0_0_0_0_0_0_0_0_2_0_0 ATGCGGTGCGCGTTGCCAGCAGATTCATGAAACGACCGTACGGCGGGGAC >R989_0_0_0_0_0_0_0_0_0_0_0_0_0_1 GCGGCGTTGGGGGAGGATAAAGCCAACAACTTGGTGGATCAAATTCTGCT >R990_1_0_0_0_0_0_0_0_0_0_0_0_0_1 AATACTACAAAGAAGCGGGTTTGATTAAGTAACGCGTTTCAACTGAGAAG >R991_0_0_0_0_0_0_0_0_0_0_0_0_1_0 
ATGGCCAGACTTGAGCAGTCTAAATGTAATGCCACCTCAAACTCCTGATC >R992_0_0_0_0_0_0_0_0_0_1_0_0_0_0 CACGTCACCGCACGACGGGCAGTGGATGATCGGGATCGGCGTGCCCCAGT >R993_0_0_0_0_0_0_0_0_0_0_0_1_0_0 TCGTGAAAATCATTCCCGGCGCGAGACGCAGCCCCGCGCCGGGCCGGCCG >R994_0_0_0_0_0_0_0_0_0_0_1_0_0_0 GAACGCTTCAAGAGCGATCCGCAGAAGATGAACGCGGCGCTGATGGAACT >R995_0_0_0_0_1_0_0_0_0_0_0_0_0_0 AGGTATTCTTTCAATTTTAGTTGGTATTTATGTATTAATTACGATGAAAN >R996_0_0_0_0_0_0_0_0_0_0_0_0_0_1 TCTCTTCATAGACTAAATTTTTGATCTCTTGCATCACCCACTGATGAATC >R997_0_0_0_0_2_0_0_0_0_0_0_0_0_0 GAACAACCGATAGATGGATACACAACAGAAGTAAATGATTATGACATTAC >R998_0_0_0_0_0_0_0_0_0_0_0_1_0_0 GGCTAACGAGGCCCATGTCGTGATGCAGCGGCAGCCAGATCACGGTGTTG >R999_0_0_0_0_1_0_0_0_0_0_0_0_0_0 TCATACATTAAGGGAAGAGATTATTGAGAAACGTGGTGGTAGGTTATTAN
HW1_student_code_example/SPRING2021_INF503_Homework_1.pdf
Homework #1
Due February 16th, 11:59pm
Each homework submission must include:
• An archive (.zip or .gz) file of the source code containing:
o The makefile used to compile the code on Monsoon (5pts)
o All .cpp and .h files (5pts)
o A readme.txt file outlining all modules (if any) needed for the execution of the code and
the exact command lines needed to answer the homework’s questions (5pts)
• A full write-up (.pdf or .doc) file containing answers to the homework’s questions (5pts) –
screenshots of code output are ok.
The source code must follow the following guidelines:
• No external libraries that implement data structures discussed in class are allowed, unless
specifically stated as part of the problem definition. Standard input/output and utilities libraries
(e.g. math.h) are ok.
• All external data sources (e.g. input data) must be passed in as a command line argument (no
hardcoded paths within the source code).
• Solutions to sub-problems must be executable separately from each other. For example, via a
special flag passed as a command line argument (5pts).
For this homework, you will need to use the High Throughput Sequence reads dataset located on
Monsoon: /common/contrib/classroom/inf503/hw_dataset.fa
• Dataset contains approximately 36 million
‘reads’ (genomic sequence fragments of
equal length)
• Each read is exactly 50 nucleotides
(characters) long
• The read set is in FASTA format (see insert)
o The headers are unique and consist
of the read ID number (e.g. R1) and
a series of ‘copy number’ values for
the number of times this read is
present in sample 1, 2, … (separated by underscore “_”)
o The genomic sequences consist of the following alphabet {A, C, G, T, N}
Problem #1 (of 1): Arrays and Classes
Create a class called FASTA_readset. The purpose of the class will be to contain a FASTA read set, all of
the statistics associated with it, and all of the functions needed to operate on this set. Use an array data-
structure to store the genomic sequence of the given read dataset. Use character arrays (char[ ] ) to store
the sequence, rather than ‘string’ objects (you should have an array-of-arrays 36 million by 50). Use
another set of arrays to store the copy number counters from the header string. At minimum, the class
must contain:
• A default constructor
• At least one custom constructor (e.g. one taking a file path or ifstream as input)
• A function to read the FASTA file
• A single function to compute all statistics for the Readset (see below)
• A destructor
A. Using the first 1 million reads, estimate and report the total CPU time and RAM it will take to
initialize (fill up) the array data-structure with the entire 36 million reads. Note that this may
mean creating a custom constructor to read the first X reads rather than reading to the End-Of-File.
B. Test your prediction using the entire 36 million read set – report actual RAM and CPU time used.
Refer to Monsoon workshop notes for help in estimating actual runtime and RAM usage of your
run. Were you accurate? If not, explain what you think caused the discrepancy.
C. Compute the following statistics for your read set
• Total number of unique sequence fragments (here, safe to assume this is the total
number of sequence fragments in the file).
• Total number of reads for each ‘data set’ separately (recall there are 14 data sets in our
example here). You will need 14 different totals.
• Number of A, C, G, and T characters in the dataset.
D. Implement a destructor for your class to delete / deallocate your array data structure. How long
did it take? Does this make sense to you?
E. Implement a function that would sort the genomic sequences (fragments not characters within a
fragment) in your array in alphabetic order.
• What is the ‘big O’ notation of your approach (linear / quadratic / cubic / etc)? Please
note that depending on the efficiency of your algorithm, you may not be able to
alphabetically sort the entire 36 million reads in a reasonable amount of time (24-36 CPU
hours). If this happens, reduce the problem size (by using a smaller subset of the reads)
and estimate the final run time.
• Print the first 20 lines of the sorted output