import java.util.*;
import java.io.*;
import java.text.*;

/**
 * Reports information about DNA nucleotide sequences that may encode proteins.
 *
 * <p>The input file consists of line pairs: a region name followed by its
 * nucleotide sequence. Each sequence may contain the letters A, C, G, T in
 * either case plus the junk character '-'. For every pair the program writes
 * the nucleotide counts, the mass percentages, the codon list and whether the
 * region is a protein-coding gene.
 *
 * <p>All per-nucleotide arrays in this class are in A, C, G, T order, with junk
 * ('-') as an optional fifth entry.
 */
public class DNA {

    /** Minimum number of codons a valid protein must have. */
    public static final int MIN_CODONS = 5;
    /** Minimum percentage of total mass that C and G together must reach for a valid protein. */
    public static final int MIN_MASS_PERCENT = 30;
    /** Number of unique nucleotides (A, C, G and T). */
    public static final int UNIQUE_NUCLEOTIDES = 4;
    /** Number of nucleotides per codon (the name reads backwards but is kept for compatibility). */
    public static final int CODONS_PER_NUCLEOTIDE = 3;
    /** Directory that input file names are resolved against. */
    public static final String INPUT_DIR = "input/";
    /** Directory that output file names are resolved against. */
    public static final String OUTPUT_DIR = "output/";
    /** When true, skips the prompts and uses fixed file names. */
    public static final boolean DEBUG = false;
    /** Molar masses (grams/mol) in A, C, G, T, junk order. */
    public static final double[] MOLAR_MASSES = {135.128, 111.103, 151.128, 125.107, 100.00};
    /** Nucleotide characters in the same A, C, G, T, junk order as {@link #MOLAR_MASSES}. */
    public static final char[] NUCLEOTIDES = {'A', 'C', 'G', 'T', '-'};

    /**
     * Prints an introduction, prompts for the input and output file names,
     * reads the name/sequence line pairs from the input file and writes the
     * report for each pair to the output file.
     *
     * @param args unused
     * @throws FileNotFoundException if the input cannot be opened or the output cannot be created
     */
    public static void main(String[] args) throws FileNotFoundException {
        // Not closed on purpose: closing it would also close System.in.
        Scanner console = new Scanner(System.in);
        String[] files = promptForFileNames(console);
        File inFile = new File(INPUT_DIR + files[0]);
        File outFile = new File(OUTPUT_DIR + files[1]);

        if (!inFile.isFile() || !inFile.canRead()) {
            System.err.println("Cannot read input file: " + inFile.getPath());
            return;
        }

        List<String> names = new ArrayList<String>();
        List<String> sequences = new ArrayList<String>();
        try (Scanner input = new Scanner(inFile)) {
            while (input.hasNextLine()) {
                String name = input.nextLine();
                if (!input.hasNextLine()) {
                    break; // a trailing name without a sequence line is ignored
                }
                names.add(name);
                sequences.add(input.nextLine().toUpperCase(Locale.ROOT));
            }
        }

        // The output directory is not created by a fresh checkout, so create it on demand.
        File outDir = outFile.getParentFile();
        if (outDir != null) {
            outDir.mkdirs();
        }
        try (PrintStream output = new PrintStream(outFile)) {
            saveOutput(sequences.toArray(new String[0]), names.toArray(new String[0]), output);
        }
    }

    /**
     * Writes the report for every sequence to the given stream. Counts and
     * mass percentages are shown in A, C, G, T order.
     *
     * @param sequences nucleotide sequences, printed exactly as given
     * @param names     region names; names[i] belongs to sequences[i]
     * @param output    stream the report is written to (not closed by this method)
     */
    public static void saveOutput(String[] sequences, String[] names, PrintStream output) {
        for (int i = 0; i < sequences.length; i++) {
            String sequence = sequences[i];
            output.println("Region Name: " + names[i]);
            output.println("Nucleotides: " + sequence);
            output.println("Nuc. Counts: " + Arrays.toString(nucleotideCountFromSequence(sequence)));
            output.println("Total Mass%: " + Arrays.toString(nucleotideMassPercentFromSequence(sequence))
                    + " of " + totalMassFromSequence(sequence));
            output.println("Codons List: " + Arrays.toString(codonsFromSequence(sequence)));
            output.println("Is Protein?: " + (isProtein(sequence) ? "YES" : "NO"));
            output.println();
        }
    }

    /**
     * Tests whether a sequence is a protein-coding gene: it has at least
     * {@link #MIN_CODONS} codons, starts with ATG, ends with TAA, TAG or TGA,
     * and C plus G account for at least {@link #MIN_MASS_PERCENT} percent of
     * the total mass. The mass test uses the reported (rounded) percentages so
     * the verdict always agrees with the printed numbers.
     *
     * @param sequence nucleotide sequence in either case, junk allowed
     * @return true if every condition holds
     */
    public static boolean isProtein(String sequence) {
        String[] codons = codonsFromSequence(sequence);
        // Check the length first so short input never indexes an empty array.
        if (codons.length < MIN_CODONS) {
            return false;
        }
        if (!"ATG".equalsIgnoreCase(codons[0])) {
            return false;
        }
        String last = codons[codons.length - 1];
        boolean hasStop = "TAA".equalsIgnoreCase(last)
                || "TAG".equalsIgnoreCase(last)
                || "TGA".equalsIgnoreCase(last);
        if (!hasStop) {
            return false;
        }
        double[] percents = nucleotideMassPercentFromSequence(sequence);
        double cytosineAndGuanine = percents[nucleotideIndexFromChar('C')]
                + percents[nucleotideIndexFromChar('G')];
        return cytosineAndGuanine >= MIN_MASS_PERCENT;
    }

    /**
     * Computes the mass contributed by each of A, C, G and T (junk excluded).
     *
     * @param sequence nucleotide sequence in either case, junk allowed
     * @return array of size 4 with each mass rounded to two decimals
     */
    public static double[] nucleotideMassesFromSequence(String sequence) {
        int[] counts = nucleotideCountFromSequence(sequence);
        double[] masses = new double[UNIQUE_NUCLEOTIDES];
        for (int i = 0; i < masses.length; i++) {
            masses[i] = roundTo(counts[i] * MOLAR_MASSES[i], 2);
        }
        return masses;
    }

    /**
     * Computes the percentage of the total mass (junk included in the total)
     * contributed by each of A, C, G and T.
     *
     * @param sequence nucleotide sequence in either case, junk allowed
     * @return array of size 4 with each percentage rounded to one decimal;
     *         all zeros when the sequence has no mass
     */
    public static double[] nucleotideMassPercentFromSequence(String sequence) {
        int[] counts = countsIncludingJunk(sequence);
        double total = unroundedTotalMass(counts);
        double[] percentages = new double[UNIQUE_NUCLEOTIDES];
        if (total == 0.0) {
            return percentages; // avoid NaN from dividing by zero
        }
        for (int i = 0; i < percentages.length; i++) {
            // Divide the unrounded values and round once to avoid accumulated rounding error.
            percentages[i] = roundTo(counts[i] * MOLAR_MASSES[i] / total * 100.0, 1);
        }
        return percentages;
    }

    /**
     * Computes the total mass of a sequence, junk included.
     *
     * @param sequence nucleotide sequence in either case, junk allowed
     * @return total mass rounded to one decimal
     */
    public static double totalMassFromSequence(String sequence) {
        return roundTo(unroundedTotalMass(countsIncludingJunk(sequence)), 1);
    }

    /**
     * Counts exact (case-sensitive) occurrences of a character in a sequence.
     *
     * @param sequence   text to scan
     * @param nucleotide character to count
     * @return number of positions where the character occurs
     */
    public static int nucleotideCount(String sequence, char nucleotide) {
        int count = 0;
        for (int i = 0; i < sequence.length(); i++) {
            if (sequence.charAt(i) == nucleotide) {
                count++;
            }
        }
        return count;
    }

    /**
     * Converts a nucleotide character to its molar mass in grams/mol:
     * A 135.128, C 111.103, G 151.128, T 125.107, junk ('-') 100.000.
     *
     * @param nucleotide nucleotide character in either case, or '-'
     * @return the unrounded molar mass
     * @throws IllegalArgumentException if the character is not a nucleotide or junk
     */
    public static double nucleotideToMolarMass(char nucleotide) {
        int index = nucleotideIndexFromChar(nucleotide);
        if (index < 0) {
            throw new IllegalArgumentException("Not a nucleotide: '" + nucleotide + "'");
        }
        return MOLAR_MASSES[index];
    }

    /**
     * Counts the As, Cs, Gs and Ts in a sequence, ignoring case. Junk and
     * unrecognised characters are not counted.
     *
     * @param sequence nucleotide sequence in either case, junk allowed
     * @return counts array of size 4 in A, C, G, T order
     */
    public static int[] nucleotideCountFromSequence(String sequence) {
        return Arrays.copyOf(countsIncludingJunk(sequence), UNIQUE_NUCLEOTIDES);
    }

    /**
     * Maps a nucleotide character to its array index: A 0, C 1, G 2, T 3
     * (either case) and junk '-' 4.
     *
     * @param nucleotide character to map
     * @return the index, or -1 if the character is neither a nucleotide nor junk
     */
    public static int nucleotideIndexFromChar(char nucleotide) {
        switch (nucleotide) {
            case 'a':
            case 'A':
                return 0;
            case 'c':
            case 'C':
                return 1;
            case 'g':
            case 'G':
                return 2;
            case 't':
            case 'T':
                return 3;
            case '-':
                return 4;
            default:
                return -1;
        }
    }

    /**
     * Removes every junk character ('-') from a sequence.
     *
     * @param sequence raw sequence
     * @return the sequence without junk
     */
    public static String removeJunk(String sequence) {
        return sequence.replace("-", "");
    }

    /**
     * Breaks a sequence into codons of {@link #CODONS_PER_NUCLEOTIDE}
     * nucleotides after removing junk. Trailing nucleotides that do not fill a
     * whole codon are dropped. The case of the input is preserved.
     *
     * @param sequence nucleotide sequence, junk allowed
     * @return array of codon strings, empty when the sequence is shorter than one codon
     */
    public static String[] codonsFromSequence(String sequence) {
        String cleaned = removeJunk(sequence);
        String[] codons = new String[cleaned.length() / CODONS_PER_NUCLEOTIDE];
        for (int i = 0; i < codons.length; i++) {
            int start = i * CODONS_PER_NUCLEOTIDE;
            codons[i] = cleaned.substring(start, start + CODONS_PER_NUCLEOTIDE);
        }
        return codons;
    }

    /**
     * Prints the introduction and prompts for the input and output file names,
     * re-prompting while a name is rejected by {@link #validFilename(String)}.
     * When {@link #DEBUG} is true no prompt is shown and fixed names are used.
     *
     * @param console scanner reading the user's answers
     * @return array of two names: index 0 the input file, index 1 the output file
     */
    public static String[] promptForFileNames(Scanner console) {
        System.out.println("This program reports information about DNA");
        System.out.println("nucleotide sequences that may encode");
        System.out.println("proteins.");

        if (DEBUG) {
            return new String[] {"dna.txt", "dna.txt"};
        }

        String[] files = new String[2];
        files[0] = promptUntilValid(console, "Input file name? ");
        files[1] = promptUntilValid(console, "Output file name? ");
        System.out.println();
        return files;
    }

    /**
     * Counts the lines in a file.
     *
     * @param file file to read
     * @return number of lines, 0 for an empty file
     * @throws FileNotFoundException if the file cannot be opened
     */
    public static int linesInFile(File file) throws FileNotFoundException {
        int count = 0;
        try (Scanner input = new Scanner(file)) {
            while (input.hasNextLine()) {
                input.nextLine();
                count++;
            }
        }
        return count;
    }

    /**
     * Checks that a file name is usable. A blank name is rejected because it
     * would resolve to the input or output directory itself.
     *
     * @param name candidate file name
     * @return true if the name is non-null and not blank
     */
    public static boolean validFilename(String name) {
        return name != null && !name.trim().isEmpty();
    }

    // Shows the prompt until the user enters a name accepted by validFilename.
    private static String promptUntilValid(Scanner console, String prompt) {
        System.out.print(prompt);
        String name = console.nextLine();
        while (!validFilename(name)) {
            System.out.println("Invalid. Try again.");
            System.out.print(prompt);
            name = console.nextLine();
        }
        return name;
    }

    // Counts A, C, G, T and junk (size 5, same order as MOLAR_MASSES), ignoring case and unknown characters.
    private static int[] countsIncludingJunk(String sequence) {
        int[] counts = new int[MOLAR_MASSES.length];
        for (int i = 0; i < sequence.length(); i++) {
            int index = nucleotideIndexFromChar(sequence.charAt(i));
            if (index >= 0) {
                counts[index]++;
            }
        }
        return counts;
    }

    // Sums count * molar mass over all five categories without any rounding.
    private static double unroundedTotalMass(int[] counts) {
        double total = 0.0;
        for (int i = 0; i < counts.length; i++) {
            total += counts[i] * MOLAR_MASSES[i];
        }
        return total;
    }

    // Rounds half-up to the given number of decimals; locale-independent, unlike DecimalFormat.
    private static double roundTo(double value, int places) {
        double scale = Math.pow(10, places);
        return Math.round(value * scale) / scale;
    }
}
+- Each character in a sequence of nucleotides will be A, C, G, T, or a dash character, "-", either upper or lowercase. +- You may assume that each sequence's number of nucleotides (without dashes) will be a multiple of 3. + +## Example + +> cure for cancer protein +> ATGCCACTATGGTAG +> captain picard hair growth protein +> ATgCCAACATGgATGCCcGATAtGGATTgA +> bogus protein +> CCATt-AATgATCa-CAGTt +> ... + +# Process: +- from the original nucleotide sequence string to nucleotide counts. +- from nucleotide counts to mass percentages. +- from the original nucleotide sequence string to codon triplets. + +# Output: + +For each nucleotide sequence: +- nucleotide counts + - Counts the occurrences of each of the four nucleotides ['A', 'C', 'G', 'T']. +- mass percentages + - Calculates the mass percentage occupied by each nucleotide type, rounded to one digit past the decimal point. +- codons + - Reports the codons (e.g. TAG) present in each sequence. +- protein-coding gene + - begins with a valid start codon ["ATG"] + - ends with a valid stop codon ["TAA", "TAG", or "TGA"] + - contains at least 5 total codons (including its initial start codon and final stop codon) + - Cytosine (C) and Guanine (G) combined account for at least 30% of its total mass + +## Example + +> This program reports information about DNA +> nucleotide sequences that may encode +> proteins. Input file name? dna.txt +> Output file name? output.txt +> Output file output.txt after above execution (partial): +> Region Name: cure for cancer protein +> Nucleotides: ATGCCACTATGGTAG +> Nuc. Counts: [4, 3, 4, 4] +> Total Mass%: [27.3, 16.8, 30.6, 25.3] of 1978.8 +> Codons List: [ATG, CCA, CTA, TGG, TAG] +> Is Protein?: YES +> ...
+ +# Approach + +## Constants + +```java +int MIN_CODONS = 5; //the minimum number of codons a valid protein must have +int MIN_MASS_PERCENT = 30; // the percentage of mass from C and G in order for a protein to be valid +int UNIQUE_NUCLEOTIDES = 4; // the number of unique nucleotides (representing A, C, G, and T) +int CODONS_PER_NUCLEOTIDE = 3; // the number of nucleotides per codon +``` + +```java +/* +* +* begins with an introduction and prompts for input and output file names. +* reads the input file to process its nucleotide sequences. +* outputs the results into the given output file. +* +* @return void +* +*/ +public static void main(String[] args) { + +} +``` + +```java +/* +* +* assumes the user will type the name of an existing input file. +* input is in the proper format. +* +* @params console +* @return files array of input and output files for processing and saving +* +*/ +public static String[] promptForFileNames(Scanner console) { + +} +``` + + + +```java +/* +* +* Converts char nucleotide to molar mass +* +* mass percentages, use the following as the mass of each nucleotide (grams/mol). +* "junk" regions are excluded from many parts of your computations, but they do contribute mass to the total. +* Adenine (A): 135.128 +* Cytosine (C): 111.103 +* Guanine (G): 151.128 +* Thymine (T): 125.107 +* Junk (-): 100.000 +* +* @params nucleotide char of nucleotide. +* @return molarMass rounded to nearest tenth. +* +*/ +public static double nucleotideToMolarMass(char nucleotide) { + double[] masses = {135.128, 111.103, 151.128, 125.107}; + double rounded = Math.round(mass * 10.0) / 10.0; +} +``` + +```java +/* +* +* Next, write code to pass over a nucleotide sequence and count the number of As, Cs, Gs, and Ts. +* use a String's charAt method to get individual characters. +* +* @params sequence sequence of +* @return counts array of size 4.
+* +*/ +public static int[] nucleotideCountFromSequence(String sequence) { + +} +``` + +```java +/* +* +* converts a single character (i.e. A, C, T, G) into indices (i.e. 0 to 3). +* +* @params nucleotide char of nucleotide. +* @return index int mapping of nucleotide. +* +*/ +public static int nucleotideIndexFromChar(char nucleotide) { + +} +``` + +```java +/* +* +* eliminate these characters. +* +* @params sequence raw sequence +* @return sequence without junk DNA '-'. +* +*/ +public static String nucleotidesOnlyFromSequence(String sequence) { + +} +``` + +```java +/* +* +* break apart the sequence into codons and examine each codon. +* +* @params sequence String of nucleotides or raw. +* @return codons Array of strings of codons. +* +*/ +public static String[] codonsFromSequence(String sequence) { + +} +``` + +```java +/* +* +* Saves output to file using PrintStream as described in Section 6.4 of the textbook. +* overwrites any existing data in the output file (this is the default PrintStream behavior). +* nucleotide sequence is output in uppercase +* the nucleotide counts and mass percentages are shown in A, C, G, T order. 
+* +* @params path String path of output filename +* @return void; +* +*/ +public static void saveOutput(String path) { + +} +``` diff --git a/dna/input/dna.txt b/dna/input/dna.txt new file mode 100644 index 0000000..0c98d4d --- /dev/null +++ b/dna/input/dna.txt @@ -0,0 +1,18 @@ +cure for cancer protein +ATGCCACTATGGTAG +captain picard hair growth protein +ATgCCAACATGgATGCCcGATAtGGATTgA +bogus protein +CCATtAATgATCaCAGTt +michael jordan mad hops protein +ATgAGATCCgtgatGTGggaTCCTaCTCATTaa +paris hilton phony protein +AtgCCaacaTGGATGCCCTAAGATAtgGATTagtgA +george w bush approval rating protein +atgataattagttttaatatcagactgtaa +jimi hendrix guitar talent protein +ATGCAATTGCTCGATTAG +tyler durden's brain protein +ATGATAcctatgagtaaTGTGGACCatatccaaACTATAGGCATtgtcggACCAACGATcgattggtTATACTGA +mini me growth hormone +AtGgGaCGCTgA \ No newline at end of file diff --git a/dna/input/ecoli.txt b/dna/input/ecoli.txt new file mode 100644 index 0000000..e9c20cc --- /dev/null +++ b/dna/input/ecoli.txt @@ -0,0 +1,40 @@ +thr operon leader peptide +ATGAAACGCATTAGCaCCAcCATtACCACCaCCATCaCcATTACCACAGGTAACGGTGCGGGCTGA +aspartokinase I/homoserine dehydrogenase I 
+ATGCGAGtGTTGAAGTTcgGCGGTaCATCAgTGGCAAATGCAGAACGTtTTCTGCGGgTTGCCGATAttCTGGAAAGcAATGCCAGGCAGGGGCAGgTGGcCACCGTCCTCtCTGcCCCCGCCAAAATCACCAACCATCtGGTaGCGATGATtGaaAAaACCATtAGCGGTCAGGAtGCtTTaCcCaATATCAGCGATGCCGAACGTATTTTTGCCGAACTtCTGACgGGACTCGCCGCcGCCCAGcCGGGATTTCCGCTGGCACAAtTgAAAAcTTTCGTCGACCAgGAATTTGCCCAAATAAAACATGTcCtGCATGGCatCAGTTTGTTGGGGCAGTGCCCGGaTAGCATcAACGCTGCGCTGATTTGcCGTGgCGAGAAAaTGTcGaTcgCCattaTGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGgTCGAAaAAcTGCTgGCAGTGGGTCATTAcCtCgAaTCTACCGTTGATaTtGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCgGCTGACCACATgGtGCTGATGGCTGGTTTCACTGcCggTAATGAAAAAGgCGaGCTGGtGGTtCTGGGAcGCAACGGTTCCGACTaCTCCGCTGCGGTgCTGGCGGCcTGTTTaCGCGCCGATTGTTGcGAgaTCTGGACGGATGTTGAcGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGgAaGCGATGGAGCTTTCTTACTTCGGCGCTAAAgTTCTTCaCCCcCGCACCATTACCCCCATcGCCCAGtTCCAGATcCCTtgCCtGATTAAAAATAcCGgAAAtCCCCAAGCACCAGgTACGCtCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATcTGAATaACATGGCAATgTTCAGcGTTTCCGgCCCGGGGAtGAAAGGgATggTTgGCATGGCGGCGCGcgTCTTTGCAGcGaTGTCACGCGCCCGTaTTtCCGTGGTgCtGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCaAAGCGACTGTGTGCGAGCTgAaCGGGCAaTGcAGGAAGAGtTCTACCTGGAaCTGaAAGAAGGCTTACTGGAGCcGTTGGCgGtGACGGAACGGCTGGCCATTATCTcGGTGgTAGGTGATGGTATGCGcACCTtaCGTGGGAtCTCGgCGAAATtCTtTGCCGCGCTgGCcCGCGCCAATATCAACATTGTCgCCATTGCtCaGGGaTCTTcTGAaCGCTCAAtCTCTGTcGTGGTcAaTAACGATgATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGgCGTCGGTGGCGTTGgcGGTGCGCTGCTGgAGCAACTGAAGCGTCAgCAAAGCTGGTTGAAGAATAAaCATATCGaCTTACGTGTCTGCGGTGTTGCTAACTCGAAGgCACtgCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGgAAGAACTGGCGCAAGCcAAAGAGCCGTTTAATCTCGgGCGcTtAATTCGCCTCGTGAAAGAATATCATCTGCtGAaCCCGGTCATTgTTGACTgTACTTCCAgCCAGGCTGTgGCAGaTCAATATgCCGACTtCCTgCGCGAAGGTTTCCAcGTTGTtACGCCGAaCAAAaAGGCCaACACCTCGTcgATGGaTTACTaCCATCAGTtGCGTTATGCGGCGGAAAAATCGCGGCGTAaATTCCTCtATGACACcaACGTtGGGGCTGGATTACCGGTTATTgAGAACCTGCAAAATCTGCTCAATGCtGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTAtATCTTCGGCAAGTTAGACGAAGGCaTGAGTtTCTCCGAGgCGACCaCACTGGCGCGGGAAATGgGTTATACCG
AACCGGAcCcGCGAGATGATCTTtCtGGTATGgAtGTGGCGCgTAagCTAtTGATtCTCGCTCGTGAAACGGGACGTGAACTGGAGCtGGCGGATATTGAAATTGAACCTgTGCTGCCCGCaGaGTTTAACGCCGAGGGTGATGTCGCcGCTTTTATGGCGAATCTGTCACAGCTCGACGaTCtCTTTGCCGCGCGTGTgGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATAttGATGAAGATgGCgTCTGCCGCGTGAAGaTTGCCGAAGTGGATGgTAATGaTCCGCTGTTCAAAGTGAaAaATGGCGaAAACGCCCTGGCCTTCTATAGCCACTATtATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCaATgACGTTaCAGCTGCCGGTgTCTTTGCTGATCTGCTACGtACCCTcTCAtGGaAGTTAGGAGTCTGA +homoserine kinase +ATgGTTAAAgTTTAtGCCCCGGCtTCCAGTGCCaATATGaGcGTCGgGTTTGATGTGCTCGGGgCGGCGGTGACACCTGTTGATGGTGCATTGCTCGgAGaTGTagTcaCGGTTGAGGCGGCAGAGACaTTCAgTCTCAACAACCTCGGACGCTTTGCCGAtAAGCTGCCGTCAGAGCCACGgGaaAATAtCGTTtATcAGTGcTGGGAGCGTtTTTGcCaGGAGCTTGGCAAGCAAATTCCAGTGGCGATGaCTCTGGAAAAGAATatGCCGAtCgGTTCGGGcTTAGGCTcCAGCGCCtGTTCAGTGGTCGCGGCgCTgAtGGCGATgAATGAAcACTGCGGCaAGCCGCTTAATGACACTCGTTTGCTGGCTTtGATGGgCGAgTTGGAAGGGcGTATCTCCGGCAGCAtTCATTACGACAACGtGGCACCGTGtTtTCtTGGTGGTAtGCAGTtgATGATCGAAGAaAACGACATCATCAGCCAGCAaGTGCCAGGGTTTGATGAGtGGCTGTGGGTGCTGGCGTATcCGGgGAtTAAAGTCtCGaCGGcAGAAGCCAGGGCTaTTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCAcGGGCgACATCTgGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATgAAAGaTGTTATCGCTGAACCCTACcGTGaACgGTTaCTGCCAGGCTTCCGGCAGGCGCGGcAGgCGGTTGCGGAAATCGGCGCGGTAgCGAGCGGTATCTCCGGCTCCGGCCCGAcTtTGTTCGCTCTGTGtGAcAAGCCGGATACCGCCCAGCGCGTTGCCGACTGgTTGGGTAAGAACtAcCTGCAAAATCAGgAAGGTTTTGTTcATATTTGCCGGCTGGATACGGCGGGcGCACGAgTACTGGAAAACTAA +threonine synthase 
+ATGAAACTCtacaATCTGAAAGATCACAATGAGCAGgTCaGCTTTGCGCAAGCCGTAACCCAGgGgTTAGGCAAAAATCAGGGgCtGTtTTTTCcgCACgaCCTGCCGGaaTTCAGCcTgACTGAAaTTGATGAGATgCTGAAGCtGGATTTTGTCACcCGCAGTGCGAAGATCCTcTCgGCGTTTATTGGTGATGAAATCCCGCAGGAAaTCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAaGCGATGTCGGTtGTCTGGAaTTGTTCcACGGGCcAACGCTGGCaTTTAAAGATTTCGGcGGTcGCTTTATGGCACAAATGCTgACCcATATTGCGGGCGATAAGCCAGTGAcCATTCTGACCGCGACATCCGGTgATACTGGaGCGGCAGTGGcTCATGcTTTCtACGGTtTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTgTTCTGTACATTGgGCggCAATATCGaAACTGTTGCCATCGAcggCGaTTTCGATGCCTGTCAGGCGCTGGTgAAGCAGGCgTTTGATGATGAAGAACTGAAAGTGgCgCtGGGGCtGAATTCTGCTAAcTCCATCAACaTCAGTCGCTTGCTGGCGcAGATTTGTTaTTAcTTTGaGGCTGTCGCACAGTtGCCGCAAGAAGCACGTAACCAGTTGgTTGTCTCGGTaCCGAGTGgAAACtTcGGCGATtTGACGGcGGGTCTGCTGGCGAaGTcACTCGGTCtGCCGGTAAAACGTtTTATTGCtgCGACCAACGTGAACGAtACCGTACCACGTTTCCTGCaCGaCGGTCAGTGGTCAcCCAAaGCGACTCAGgCGAcgTtaTCCAATGCGATGGATGTTAGCCAGCcAAaCAACTGGCCGCGTGTGGAAGAGTTGtTCcGCCGCAAAATCTGGCAACTGAAAGAGCTGGgTTATGCAGCCGTGgATGATGAAACCACGCAACAGACAATGcGTGAGtTAAaAGAACTGGGCTATACCTCGgAGCCGCACgCTGCCGTAGCTTATCGTGCGCTGCGTGACCAgTTGAAtCCAGGCGAATATGGCTTGTtCCTCGGcACcGCGCATCcGGcGAAatTtAAAgAGAGCGTGGAAGCGATTCTCGGTGAAAcGTTGGatCTGCCAAAAGAGCTGGCAGAACGTGCTgATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAatTgaTGATGAaTCATCAGTAA +hypothetical protein +AtGCAGCCcGGCTtTTTTTATGAAGAAAATaTGGAGaAaAACGACagGGAAAAAGGAGAAATTCtCAATAAATGCGGtAACTTAGAgATTaGGATTGCGGAGAATaACAACTGCcGTTCTCaTCGCGTAATCTCCGGATATCGACCCaTAACGGgCAATGATAAAAGgAGTAACCTGTGA +Non-protein region +aAAAACTgCTGGAAACAATGAAAGAcGTACCGGACGACCAAcGTCAGgCGC +transaldolase B 
+ATGACGGACAAATTGaCCTCcCTTCGTCAGTACACCACCGTAgTGGCCGACACTGGGGACATCGCGGCAATGAAGcTGTaTCAACcGCAGGATGCCACAACCAAcCCTtCTCTCATTCTTAACGCAGCGCAGATTCcGGAATACCGTAAgTTgATTGaTGATGCTGTCGCCTGGGcGAaACaGCAGAGCAAcGATcGCgCgCAGCAgATCGtGGACGCGACCGAcAAACTGGCAGTAaATATTgGTCTgGAAaTCCTGAAACTGgTTCCGgGCCgTATCTCAActGAAGTtGATGCGCGTCTTTCCTATGACaCCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGcAGGTaTTAGCAACGATCgTaTTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGcAGAACAGCTGGAAAAAGAaGGTATTAACTGTAAcCTGACCCTGCTgtTCTCctTCGCtCAGGcTCGTGCTTGTGCGGaAGCGGgCGTgTTCCTGaTCTCGcCGTTTgTTGGCcGTATTCTTGACTGGTAcAAaGCGAATACCGaTAAGAAAGAGtACGCTCcGGCAGAAGATcCGGGCGTGGTTTCTGTatCtGAAATCtACCAGtACTACaAAGAGCATGGTTaTgAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAAcTGGCAGGCTGCGACCGTCTGACCatCGCACCGgcACTGCTGAAAGAGCTGgCGGAGAGCGAAGGGGCTATCgAACGTAAACTgTCTTACAcTGgTGAAGTgAAAGCgCGTCCGGcGCGTATCACtGAGtCCGAGTTCCTgTGgCAgCACAACCAGGATCCAATGGCAGTaGATAAACTgGcGGaAGgTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCtGTAA +molybdopterin biosynthesis mog protein +ATGAATACTTTACGTATTGGCTTaGTtTcCaTCTCTGATCGCGCATCCAGCGGCGTTTAtCAGgaTAAAgGCATCCCTGCGCTGGAagAATGGCTGACAtcGGCGCTAACCACGcCGTTTGAaCTGGAAAcCCgCTTaATCCCCGATGAGCAGGCGATCATCGAGCAaACgTTgTGTGAGCTGGTGGATGAAaTGAGtTGCCaTCTGGTGCTCACCACGGGCGGAAcTGGCCCTGCGCGTCGTGAcgTAACGCcCGATGcGACGCTGGCAGTAGCGGACCGCGAGATgCcAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACcaaCTGCGATCCTTTCGCGTCAGGTggGGGTgATTCGCAAACAGGCGCTGATCCTTAACTTaCcCGGTCAACCGAAGtCTATTAAAGAGACGCtGgAAGGTGtGAAGGACGCTGAGgGTAAcGTTGTGGTGCACGgTATTTTTGCCaGCGTaCcGTaCTGCATTCAGTTGCTGGAAGGGCCATACGTTGAaACGGCaCCgGaAGTGGTTGCAGCATTCAGaCCGAAGAGTGCAaGACGCGAAGtTAGCGAATAA +chaperone protein DnaK 
+aTGGGTAAAATAaTTGGTATCGACcTGGGTACtACCAaCTCTTGTGTagCGaTTAtGGATGGCACCACTCCtCGTGtACTGgAGAACGcCGAAGGCGATCGCACCAcGcCTTcTATCATTgCCTATACCCAGGAtGGTGAAACTCTGGTTgGTCAGCCGGCTAAACGTCAGGCAgtGACGAACCCgCAaAACAcCCTGTtTGCGATTAAACGCCtGATTGGCCGCCgCTTCCAGgACgAAGAAGTACAGCGtGATgTTTcCATCATGCCGTTCAAAATTAtTGcTGCtgatAACGGCGACGcATGGGTCGAAGtTAAAgGCCAGAAAATGGCAcCGCCGcAGAtCTCTGCTGAAGTGCTGAAAAAAAtGAAGAAAACCGCTGAAGaTTAcCTGGgTGAAcCGGTAACTGaAGCTgtTATTACCGTACCGGCAtACTttaACGATGCTCAGCGTCAGGcAACCAAAGaCGCAGGCCGTATCGCTGGTCTGGAAGTAAAaCGTATCATCAACGAaCCGACCGCAGCTGCGCTGGCTtACGGtCTGGACAAAGgTACTGGCAACCgtACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTcCATTATCGAaATCGACGAAGTTGACGGCgAAAAAACCttCGAAGTTCTGGCAACCAACGGTGATACCCACCTGgGTGGtgAAGACTTCGACAGTCGTCTGATCAACTAtCTGGTTGAaGAATTCAAgAAAGATCAGGGCATTGacCtGCGCAACGaTcCGCTGGCAATGCAGCGCCTGAAaGAAGCGGCAGAAAAAGCgAAAATCGAACTGTctTCCGCTCAGcAGACCGaCGTTAACcTGCCGTACATCACTGCAGACGCGAcCGGTCCGAAACACAtGAACATCaAAgTGactCGTGCGAAACTGGAAAGCCTgGtTGAAGAtCTGGTAAACCGtTcCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATAtCGACgaCGTTATTCTCGTTGGTGGTCAGACTCGTATGCcAATGGtTCAGAAGAAAGTTGCTGaATTCTTTGGTAAAgAGCcGCGTAAAGATGTTAACCCGGACGAAGCTGTaGCCATCGgTGCTGCTGTTCAGGGTGGTGTTCTGACTGGtGAcGTAAAAGaCGTacTGCTgCtGGACGTTACCCCGCTGTCtCTGGGTATcGaAACCaTGGGCGGTGTGATGACCACGCTGATCGCgAaAAACACCACTATCCCGACCAaGcAcaGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATcCATgtGCTGcAGGGTGAACgTAaACGTGCgGCTGAtAAcaAATCTCTgggTCAGTTcAACCTGGATGGTATCAaCCCGGCACCGcGCGGCAtgCCGcAGATCGAAGtTACCtTCGAtATCGaTGCTGACGGTATCCTGCaCGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCAcTATCAaGGCTTCTTCTGGtCTGAaCGAAGAtGAAATCCAGAAAATGGTACGCGaCGCAGAAGCTAAcGCCGAAGCTGACCGTAaGTTTGAAGAGCTGGTACAGACtcGCaACCAGGGCGACCATCTGCTGCACAgCACCCGTAAGCAgGTTGAAGAAGCAGGCGACAaACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGActGCACTgGAAACtGCTCTGAAaGGTGAAGaCAAAGcCgCTATcGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCaGCAGCAACATGCcCAGCAGCAGACTGCCGGTGCTgATgCTTCtGCAAaCAAcGCGAAAGaTGACGATGTTGTCGACGCtGAATTTGAAGAAGTCAAAGACAAAAAATAA +chaperone protein DnaJ 
+GTGCatTCatCTAGGGGcAATTTAAAAAAGATGGCTAAGCAAGATTaTTACGAGaTTTTAGGCGTTTCCAAAaCAGCGGAAGAGCGtGAaaTCAAAAaGGCCTACAAACGCCTGGCCATGAAaTACCaCCCGGaCcGTAACCAGGgTGACAAAGaGGCCGAGGCGAAATTTAAAGAGATCAAGGaAGCTTATGAAGTTCTGACCGACtCGCAAAAACgTGCgGCATaCGATCAGTaTGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGcGGtTTTGGCGGCGGCgCAGACTTcAGCGATAtTTtTGGTGACGtTTTCGGCgATATTTTTGGcGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTAcGCTATAACATGGAGctCACcCtCGAAgAAGCTGTACGtgGCGtGaCCAAAGaGATccGCATtCCGACTCtGGAAGAGTGTGACGTTTGCCACgGTAGCgGTGCAAAACCaGGTACACAgCCgCAGACCTGTCCGACcTgTcATGGTTCTGGCCAGGtGCAGATGcGCCAGGGTTTCTTTGcCGTGCAGCAGACCTgTCcAcACTGTCAGGGCCGCGGTACGCTGaTcAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGtTGAGCgCaGCAAAACGCTGTCCGTTAAAATCCCGGCaGGGgTGGACACTGGAGaCCGCATCCGTCTTGCGgGCGAAGGTGAAGCGGGTGAACACGgCGCACCGGCAGGCGATCTgTACGTTCAGGTtCAGGTtAAACaGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGcGAAGTcCCGATCAAcTTCGCTATGgCGGCGcTGGGTGGTgaAATCGAAGTACcGACCcTTGATGGTcGcGTCaaACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAgCTGtTCCgTaTGCGCGGTAAAGGCGTCAAGTCtGTcCGCGGTGGcgCACAGGGTGATTtGCTATGCCGCGTTGTTGTCgaAACAcCGGTAGGTTTGAACgAGAAGCAGAAACAGCTGCTGCAAGaGctGCAAGAAAGCtTTGGTGGcCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCtTCTTtGATGGCGTGAaGAAGTTTTTTGACGaCCTgACTCGCTAA +hypothetical protein +TTGCTCTTaCTCGGATTCgTAAGCCGTGAAAACAGCAaCCTCCGtCTGGCCAGTTCGGATGTGAACCTCACAGAGgTCTTTTCTCGTTACCAgCGCCGCCACTACGGCGGTgATACAGATGACGATCAGgGcgACaAtcAtCgCcTTATGCTGCTTCATTGCTCtCTtCTCCTTGACCTTTCGGTCaGTAAGAgGCACTCTACATGTGTTCTGCATATAGgGGGCCTCGgGTtGATGgTAAAATAtCACTCGGGGCTTTTCTCTAtCTGCCGTTCAGCTAATgCcTGA +hypothetical protein 
+aTGTCTGCCAAaaGACGACTTCTTATTGCGtGTACCTTGAtAaCAGCTATcTATCAtTTTCCTGcaTATTCTTCATTAgAATATAAAGGAtCCTTTGGTTCAATaAATGCGGGTTAtGCAGACTGGAATAGTGGaTTTgTAAaCACTCACCGTGGTGAaGTATGGAAAGTGACtGCGGATTTTGGGgTaAATTTTAAAGAAGCAGAATTTTACTCAtTTTATgAaAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACgGtTTCAGCAATGaCGCATGTCAGACTCtTTGaCtCTGATaTGACATTCTTTGGCAAAATTTaTGgCCAATGGGATAACTCATgGggTGAcGATCTgGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCgAgTGGgGCTTTTtTAAACCGTATATTGGATtGCATAATCAATCTGGTGACTACGTATCAGCTAAATaTgGTCAAACGAATgGTTgGAATGGtTATGTTGTTGGCTGGACAGCAgTATTAcCATTTAcGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGaAATAGAACTGGACAGGaACGATGCTTACACGgAgCAGcAATTTGGCcGGAACGGgTTaAaTGGCGGtTTAACTATTGcCTGGAAGTTCTATCCTCGCTGGAAAGCCAGtGTGACGTGGCGTTATTTcGATAAtAaGCTGGGCTACGATGGCTTTgGcgaTCAAATGATTTAtATGCTTGgTTATGATTTCtAA +putative secreted sulfatase +ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAAtGCTTTTAGtCCTGCCTTAGCCGCAGAGGCTaAACAACcTAATTTAGTCATtaTTATGGCGGaTGATtTAGGTtaTGGCGAtTTAGcAaCaTATGGTCATCAGATCGTTAAAACACctAATATCGACAGGCtTGCCCAgGAAGGGGTCaAATTtACTGAcTaCTATGCCCCCGCTCCTTtAaGTTCAccTtCACGCGCaGGGCTATTAACCGGCcGGATGCCATTtCGTAcTGGAATTCGCTCATGGATtCCttCAGGCAAAGATGTTGCCtTAGGGCGTAACGAAcTCACgATTGCTAaTCTACTCAaAgCGCAaGGGTACGACACggCAATGATGGGTAAGCTGCATCTGAATgCAGGcGGCGaTCGCACCGATCAgCCaCAAGCACaAgATATGGGcTTTGATTAcTCAcTGGTtAATACgGCGGGCTTTGTTACcGACGCCACGCTGGATAAcGCTAAAGAACGCCcGCGTTATGGCATGGTTtAccCGACAGGCtgGCtACGTAACGGGCAACCCACTcCACGaGCTGATAAAAtGAGCGGTGAGTATGTCaGTTCGGAAGTCGTCAACTGGCTGGATAACAAAaaGGACaGCAAGCCTTTCTTCCTCTATgTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAaaATACCTCGATaTGTaCTCACaATATATGAGCGCGTATCAGAAGCAGcATCCTGATTTAtTTTaTGGCGACTGGGcAgACAAACCCTgGCGTgGTGTGGGgGAATATTAtGCCAATATCAGCTATCtGGATGCAcAGGTTGGAAAAgTGCTGGaTAAAATCAAAGCTGTGGgtGaAGaaGaTAACACAATCGTTATTTTTACCAGTGatAACGGTCCgGTAaCGCGTGAAGCGCGCAAAGTGTATgAGCTGAATTTGGCAGGGGAaACGGaTGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGtGTTCCaGCCATTATTAAATaTGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGtCTgGACTGGATGCCTACtTTaGCgAaAATGATGAACTTCAAATTACCTACAGAcCGTAcTTTCGATGgTGAATCGCTGGTTCCTGtTcTTGAGCaAAAAGCATTGAAA
CGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATgATCCAAcCGATGAATGGGCGATCCGTGATGgTGACTGGAAgAtGATTATCGATCGcaATAATAAACcGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAaCaCTTaAtCTGATCGGTAAAAAAACAgATATTGAAAAACAGATGTATGGTaAGtTTtTAAAATATAAAACTGATATTGATaATGATtCTCTAATGAAAgCCAGAGGTGATAAACCAGAAGCGGTGACCTggGGCTAa +putative cytoplasmic protein +ATGTTTACcAacGTAAATGTTGATTGtTgCAAAACACCAGGAtGTAAaaACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCAcAGgGTaAaAATATTTtATGCCGTGAATGTgGTTaCTTGTtTCCAGtGATATCTGAACAGTCGCTTAAtATTTaTCGTAATATTGTGAAtcACTcCTGGAGAGGTTTGATTTGCCAATGTTCAACTtGCGGAGGcACGTCCCTCAAAAAATaTGgATATtCtGCAcAagGCCAgAGAAGAATgTATTGCcaTCAtTGTGaGAAAACaTTtATCACTCTGGAAcAtGTAATTACcACACCACGAGGAGCcCTGTTAGcATTGATGATTGAGCAAGGGGAGGCACTTGCGGaTATCAgAAAGTCATTACGTCTTAACAgCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGcAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGtACCCGCGCTTtTCGcgTCAAGTAtAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGcGGCAGGGTgGTTGcCaTCTCAACCAATTACTCCCCATCtGCCGTAGagCaaCATTATcAATACaCATCGAACtATGAAGAGcGTATGTCTCCAGGGACGCTGGCACAtCATGTCCAGCGCAAAGAGttACTTACTATGCGGCgGGATACCTTGTTTGATATTGATTACGGCcCGgCAGTTTTACATCAAAACGATCCGGGAATGtTGGTAaAaCCGGTTCTTCCGGCATaTCGTCATTTTgAACTGGTCAGAATACTGACCGATGAGCATtCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATaTTGGGCGGCTGcCTGATGGCTAATTTGCAGCaTATTCATCAaGGTCGCTGCCATATTTCcTTTGTCAAaGAGCGcGGTGTGGCACCCGCCACCATTGaTTTTCCACCGCGATtATTCcTTAGTgGtGGgGTACgAAATAATGTCTGGCGTGCaTTTTCTAACCGCAATTATTCAaTGGCTGTATGCAAtCTCaCTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATtGAACAGTGCGACGCgTTtTATCCACTTTGTGgaGAACCATCCTTTCCTTATaTCATTGAACCGAATgtCTCCTGCGaaTGTCgtTTCTACaTTAGATaTCCTCAAACaTCTGTGGAATAaAaAACTAGagCATGGAACAATTtAA +sodium/proton antiporter 1 
+GTGAAACATCTGcATCGATTCTTTAGCaGTGATGCCTCGGGAGgCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTgcAaCCAGTGGATGGTATCACGACTTTCTTGAGACGCcGGTTCAGcTcCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGaCGCTCTGaTgGCGGTATTTTTCCTGTtGGTTGGTcTGGaAGTTAAAcGCGAGcTGaTGCAaGGTTCGCTGGCCAGTCtGCgCCAGGCGGCatTTCCTGTTATTGCCGcAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTtTtAACTATGCCGATCCGaTTaCCCGCGAAGGcTGGGCAatCCCGGCGGCGACTGacATTGCCTTTGCACTTggTgTGTTGGCGCTgTTGGGAAGTCGTGTTCCGTTAGCGCtGAAGATCTTTTtGATGGCTCTGGCtATTATCGACGATCTTgGGGcCATCATtATCATCGCATTGTTCTACAcTAATGACTTATCGATGGCCTcTCTTGGCGTcGCgGCTGTAGCAATTGCGgtACTCGCGGTATTGAAtCTGTgTGGTGTAcGCCGCACGGGCGTtTATATTCTGGTTGGCGTGGTGCtGTGGaCAGCGGTGTTGAAATCGGGGGTTCACGCAACCcTGGCTGGCGtCATtGtCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGgCGCTCTCcGgCTAAACGTCTGGAGCATGTTTTGCAtCCATGGGTGGCGTATCTGATtTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAaGGTgTCACGCtggAaGGTTTgACCtCCATTCTGCCATTAGgGATCATCGCTGGTTTGCTGaTTGGCaAGCCACtGGGTAtTaGTCTgttcTGCTGGtTGGcgCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACgACTtACCAGCAAATTATGGCGGtTGGTaTCcTGTGCGgTATCgGTTtTAcTatGTCTATCTTTATTGCCAGCCTGGcATTTGGTAgCGTAGATcCAGAaCTGaTTAACtGGGCAAAAtTAgGTATCCTTGTCGGTTCAATTTCtTcGgCGGTAATTGGATATAGcTGGTTACGcGTTCGTTTACGTCcATcAGTTTGA +transcriptional activator protein NhaR 
+ATGAGCATGTCTCATaTCAATTACAACCACTtGTATTACTTCTGGCaTGTCTAcAAAgAaGGTTCTGtGGTTGGCgCAGCGGAGGCGCTTTATTTAACAcCAcAAACCATTACCGGGCaGATCCGGGCGCTGGAaGAGCGCCTGCAAGGGAAAcTATTTAAGCGTAAAGGAcgTGGTCTGGAACCCAgcGAACTGGGGGAACTGGTCTATCGCtATGCCGATAAAATGTTCAcCTTAAgCCAGGAAATGCTgGATATCGTCAACTATCGCAAAGAGTCCAACTtATTGtTTGATGTTgGTGTGGCAGATGCACTTtcCAAAcGtcTGGTCAGCAGTGTTCtgGATgCCGCAGTtgTGGAAGACGAGCAGAtCCATCTACGCTGTTTCGAaTCGACGCACGAGATgCTTTTaGAGCAgtTGAGTCAGCATAaACTGGATATGATcaTCTCTGACTGTCCGaTCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAaTtGGCGAATGTGGTGTCAgtTTCTGGTgCACTAACCCACTACcAGAAAAGCCGTTTCCTGCCtGTCTTGAAgAGCgTCGtTtACTTATTCCGGGGCGTCGCTCAaTgTTGGGGCGtAAACTATTAAACTGGTTTAACTCcCAGGGCTTGAACGTCGAAATTTTGgGTGAGTTTGATGATGCTGCGTTGATGAAAgCCTTTGGGGCGAcGCATAACGcTATTTTCGTTGCACCTTCGCtTTACGCTAATgATTTCTATAACgATGACTCGgTtGTGgAGATAGgCCGTGTTGAGaACGTGATGGAAGAGTACCACGCGATTTtTGCCGaAAGgaTGAtTCAgCACCCTGcAGTAcAGCGTATCTGcAATACAgacTATTCTGCGCtgTTTACTCCAGCTTcAAAATAA +riboflavin kinase +ATGAAGCTGATACGCGgCAtACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTaATTTCGACGGCGTGCATCGCggTCATCGCGCGCTGTTACAGGGCtTGCAGGAAGAAGGGCGCAAGCGCAACtTACCGGTGATGGTGATGCTTTTtGaACCTCAACCAcTGGAACTGTTTGCTACTGAtAAAGCcCCGGCACGGcTcACcCGGCTGCgGGAAAAACTGCgTtaTcTTgCAGAgTGTGGCGTTGATTACGTGCTGTGCGtGCGTtTTGaCaGGCGTtTTGCGGCGTTAACCGCGcAAAACTTCATCAgTGATCTtCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGAtTTCCGCTTTggCGCTGgTCGTGAAgGCGAtTTCTtGTTATTACAGAaAGcgGGCATGGAATACGGCTTCGATATcACCAGCaCGCAAAcTTtTTGCGAAGGTGGTGTGCGtATCAGcAGCACCGCCGtgCGTCAGGCGCtTGCGgATgACAATCTGGCTCTGGCAGAAAGTTTACTGGgGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGaATTAGGGCGCAcTATAGGTTTCCCgACGGCGaATGTACCGcTaCgCCGTCAGGTTTCCCCGGTGAAAgGGGTTTATGCGGTAGaAgTgTTGGgCCtTGgCGAAaAGcCGTTAcCCGGcgTTGCAAACaTCGGAACACgCCCAACGGTTGCcGGTATTCGCCAGCAACTGgaAGTGCATTTGTTAGATGTTGcAATGGaCCTTTATGGTCGCCAtATACAAGTAGTGCTGCGtAAAAaAATAcGCAATGAGCAgCGATTTGcATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGcCCGCGaaTTTtTTGGGCTAAcAAAACCGGCTTAa +Isoleucyl-tRNA synthetase 
+ATGAGTGACTATAAATCaACCCTgAATTTGCCgGAAACAGgGTtCCCGATgCGTGGCGATCTCGcCAAGCGCGAAcCGGGaATGCTGGCGCGTTGGACTGATGATGATCTgTaCGGCATCATCCGTGCGGCTaAAAAAGGCAaAaAAACCTTCAtTCTGCATgATGGCCcTCCTTATGCGAATGGCAGCAtTCaTATTGGTcACTCGGTTAACAAGATTCTGAAAGACATTaTCATTaAgTCCAAAgGGCTttCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCaTGGtCTGCCAATCGAAcTGAAAGTAGAGCAAGAATACGGTAAGCCGGGgGAGaAaTTCACCGCCGcTGAGTtCCGCGCCAAGTGCCGCGAATACGCTGCgACCCAGGTTGACGGTCAGCGCAAAGACTTTaTCcGTCTGGGCGTGCTGGGCGActgGTCgcACCCGTACCTGACCATGGACtTCAAAACTGAAGCCAACATCATCCgCGCGCTGGGCAAAATCATCGGCAAcGGTCACCTGCACaAAGGcGCGAAGCCGGTgCACTGGTGCgTTGACTGCCGTTCTgCACTGGCAGAAGCGGAAGtTgAGTATTACGacAAAACTtCTCCGTCCATCGACGTCGCTTtCCAGGCGGTCGATCaGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATgTTAACGGCCCAATTTCGCtGGTTATCTGGaCcACCACGcCGTGgAcGCTGCcTGCTAacCGCgCAATCTCcATtGCACCTGATTTTGAttATGCGCTGGTGCaAatCgACGGTCAGgCCGTGATCCTCGCGAAAGATCtGGtTGaAAGCGTAAtGCAGCGTATCGGCGTTAGCGaTTACACCATTCTTGGCAcGGtgAAAGGTGCCGAGCtGGAACTGTTgCGCTTTACCCATCCGTTtATGGACtTCGATGTTCCGGCAaTTCTCGGCGACcACGTTACgCTGGATGCCGGTACCGGTGcCGTTCATACCGCGCCAGGCcACGGTCCGGaCGACTATgTGATCGGTcAAAAATaTGgTCTGGAAaCCGCTAACCCgGTTgGCcCGGACGgCACtTaTCTGCcGgGTACTTACCCGACTCtGGATgGCGTTaACGTCTTCAAAGCGAACGaTATTGTCATTGCGTTGTTgCAGGAAAAAGGcgCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTgCTGCtGGCGTCaTAAaACGCCGATCAtCTTCCGcgCGACGCCGCAGTGGTTCGTCAgCAtgGATCAGAAAGGTCTGCgTGCGcAGTCACTGAAAGAGATCAAAGGCgTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATcTCTCGTCaGCGTACCTGGGGcGTGCCgATGTCACTGTTCGTgCaCAaaGACACAGAAGAaCTGcATCCGCgTACTCtcGAACTGaTGGAAGAAGTGGcAAAACGCGTTgAAGTtGACgGCATTCAGGCgTGGTGGGATCTCGATGCGAAaGAgATCcTCGGCGaCGAAGCTGACCAGTATGTGAAAGTACCGGATACGCtGgATGTATGGTtTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTcCGGAATtTGCCGGTCACGCAGCGGACATGTaTcTGgAaGGTTCTGACCAACACcGTGgCTGGTtCATGTCtTCCCTGATGATCTCTACCGCGATGAAGGGcAAAGcGCCATATCGTCAGGTACTGACTCACGGCTTTAcCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGtAACaCcGTTTCGCCGCAGGATGTgATGAATAAACtGGGtGCGGATATTCTGCGTCTGTGGGTGGcATCAACCGACTAcACTGGCGAAATGGCcGtTTCTGACGAGATCcTGAAACGtGCTGCcGACAGCTATCGTCGTATCcGTAACAcCgCGCGCTTCCTGCTGGCAAACCTGA
ACgGTTtTGAtCCGGCaAAAGaTATGGTGAAACCGGAAGAGATGGTGGTaCTGGATCGCTGGGCCGtAGGTTGTGCGAAAGCGGCACAGGAAGACATCCtCAAGGCgTACGAAGCATACGATTTCcACGAAGTGGTaCAGCGTcTGaTGCGCtTCTGCTCCGTTGAGATGgGTTccTTCTACCTCGACATCATCAAAGACCGTCAgTATACcGCCAAAGCGGaCAGCGTGGCGCGTCGTAGCTGCCAGAcTgCGCTGTATCACATCGCaGAAGCGCTGGTTCGCTGGATGGCAcCAATCCTCTCCTTCaCcGCTGaTGAAGTGTGGGGtTaCCTGCCggGCGAACGTGAAAAATACGTCTTCAcCGGCgAgTGgTACGAAGGCCTGtTTGGTCTGGCAGACAGTGAAGCAATGAACGaTGCGTTCTGGGACGAGCTGTTGAAAGTGcGTGGCGAAGTGAAcAAAGTcaTTGAGCAAGCgCGTGCCGATAAGAACGTGGGcGGCTCGCTGGAAGCGGCAGTAAcCTTGTATGCAGAACCGGAaCTGGCgGCGAaaCTGaCCGcGCTGGGCGAtGAATTACGATTTGTCCTGtTGACCTCCGgCGCTAcCGTTGcAGACtATAACGACGCACCTGCTGATGCCCAGCAGaGCGAaGTcCTCAAAGGGCTGAAAgtCGCGTTGAGTAAAGCCgAAGGtGaGAAGTGTCCtcGctGCTGgCACTACACCcAGgATGTcGgCAAGGTGGCGGaACACGCAGAAATCTGCGGCCGCTGTgTcAgCaACGTCGCCGGTGACGGTGAAAAaCGTAAGTTTGCCTGA +Non-protein region +GCTTGCGCCAACGcCATTTCATCGCCATCCCGCCgAgcATACAGGCCTCGgAaGAACCAaTGGTGTTGGTGcCAACGGCCtGAccATTTTTcGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGcAGaTTGCGGATATTctTCTTTGTCGATCCAGTTTTTGTtAATGGAtAAAtCCA +FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase +ATGTCTGAATCTGTACAGaGCAaTAgCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGAtGGCaCCAcCGCTGAGTCTACCCGCAaCAaCGGTAaACCGGCGCTGTTCCGCcTGgGTgATGCTTCTCTTTCTgAaGgGCTGGAGCAACACCTGCTgGGGCTGAAAGTGGgCGATAAAACCaCCTTCtCGCTGGAGCCAGATGCGGCgTTtgGCGTGCCGTcACCgGAcCTGATtCAGTAcTTCTCcCGCCGTGAATTTATGgATGCAGGCGAGCcaGAAATTGGCGCAATCATgCTTTTTACCGCAATGGaTGGCAGTGAGATGCCTGGCGTGaTCCGCgAAATTAACGGCGACTCCATTACCGTTGATTTCAACCaTCCGCTgGCCGGGCAGACCGTTCATTTTGATATTGaagTGCTGGaAATCGATCCGGCAcTGGAGGcGTaA diff --git a/dna/output/dna.txt b/dna/output/dna.txt new file mode 100644 index 0000000..490dddc --- /dev/null +++ b/dna/output/dna.txt @@ -0,0 +1,63 @@ +Region Name: cure for cancer protein +Nucleotides: ATGCCACTATGGTAG +Nuc. 
Counts: [4, 3, 4, 4] +Total Mass%: [27.32, 16.84, 30.55, 25.29] of 1978.76 +Codons List: [ATG, CCA, CTA, TGG, TAG] +Is Protein?: YES + +Region Name: captain picard hair growth protein +Nucleotides: ATGCCAACATGGATGCCCGATATGGATTGA +Nuc. Counts: [9, 6, 8, 7] +Total Mass%: [30.65, 16.8, 30.47, 22.07] of 3967.54 +Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, GAT, ATG, GAT, TGA] +Is Protein?: YES + +Region Name: bogus protein +Nucleotides: CCATTAATGATCACAGTT +Nuc. Counts: [6, 4, 2, 6] +Total Mass%: [35.13, 19.25, 13.1, 32.52] of 2308.08 +Codons List: [CCA, TTA, ATG, ATC, ACA, GTT] +Is Protein?: NO + +Region Name: michael jordan mad hops protein +Nucleotides: ATGAGATCCGTGATGTGGGATCCTACTCATTAA +Nuc. Counts: [9, 6, 8, 10] +Total Mass%: [28.0, 15.35, 27.84, 28.81] of 4342.86 +Codons List: [ATG, AGA, TCC, GTG, ATG, TGG, GAT, CCT, ACT, CAT, TAA] +Is Protein?: YES + +Region Name: paris hilton phony protein +Nucleotides: ATGCCAACATGGATGCCCTAAGATATGGATTAGTGA +Nuc. Counts: [12, 6, 9, 9] +Total Mass%: [33.96, 13.96, 28.49, 23.58] of 4774.27 +Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, TAA, GAT, ATG, GAT, TAG, TGA] +Is Protein?: YES + +Region Name: george w bush approval rating protein +Nucleotides: ATGATAATTAGTTTTAATATCAGACTGTAA +Nuc. Counts: [12, 2, 4, 12] +Total Mass%: [41.06, 5.63, 15.31, 38.01] of 3949.54 +Codons List: [ATG, ATA, ATT, AGT, TTT, AAT, ATC, AGA, CTG, TAA] +Is Protein?: NO + +Region Name: jimi hendrix guitar talent protein +Nucleotides: ATGCAATTGCTCGATTAG +Nuc. Counts: [5, 3, 4, 6] +Total Mass%: [28.58, 14.1, 25.57, 31.75] of 2364.1 +Codons List: [ATG, CAA, TTG, CTC, GAT, TAG] +Is Protein?: YES + +Region Name: tyler durden's brain protein +Nucleotides: ATGATACCTATGAGTAATGTGGACCATATCCAAACTATAGGCATTGTCGGACCAACGATCGATTGGTTATACTGA +Nuc. 
Counts: [24, 14, 16, 21] +Total Mass%: [32.95, 15.8, 24.56, 26.69] of 9843.81 +Codons List: [ATG, ATA, CCT, ATG, AGT, AAT, GTG, GAC, CAT, ATC, CAA, ACT, ATA, GGC, ATT, GTC, GGA, CCA, ACG, ATC, GAT, TGG, TTA, TAC, TGA] +Is Protein?: YES + +Region Name: mini me growth hormone +Nucleotides: ATGGGACGCTGA +Nuc. Counts: [3, 2, 5, 2] +Total Mass%: [24.82, 13.6, 46.26, 15.32] of 1633.44 +Codons List: [ATG, GGA, CGC, TGA] +Is Protein?: NO + diff --git a/dna/output/dna_file.txt b/dna/output/dna_file.txt new file mode 100644 index 0000000..a555891 --- /dev/null +++ b/dna/output/dna_file.txt @@ -0,0 +1,63 @@ +Region Name: cure for cancer protein +Nucleotides: ATGCCACTATGGTAG +Nuc. Counts: [4, 3, 4, 4] +Total Mass%: [27.51, 16.96, 30.77, 25.47] of 1964.7 +Codons List: [ATG, CCA, CTA, TGG, TAG] +Is Protein?: YES + +Region Name: captain picard hair growth protein +Nucleotides: ATGCCAACATGGATGCCCGATATGGATTGA +Nuc. Counts: [9, 6, 8, 7] +Total Mass%: [30.76, 16.86, 30.58, 22.15] of 3953.5 +Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, GAT, ATG, GAT, TGA] +Is Protein?: YES + +Region Name: bogus protein +Nucleotides: CCATTAATGATCACAGTT +Nuc. Counts: [6, 4, 2, 6] +Total Mass%: [35.56, 19.49, 13.26, 32.92] of 2280.1 +Codons List: [CCA, TTA, ATG, ATC, ACA, GTT] +Is Protein?: NO + +Region Name: michael jordan mad hops protein +Nucleotides: ATGAGATCCGTGATGTGGGATCCTACTCATTAA +Nuc. Counts: [9, 6, 8, 10] +Total Mass%: [28.37, 15.55, 28.2, 29.18] of 4286.8 +Codons List: [ATG, AGA, TCC, GTG, ATG, TGG, GAT, CCT, ACT, CAT, TAA] +Is Protein?: YES + +Region Name: paris hilton phony protein +Nucleotides: ATGCCAACATGGATGCCCTAAGATATGGATTAGTGA +Nuc. Counts: [12, 6, 9, 9] +Total Mass%: [34.27, 14.09, 28.74, 23.79] of 4732.2 +Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, TAA, GAT, ATG, GAT, TAG, TGA] +Is Protein?: YES + +Region Name: george w bush approval rating protein +Nucleotides: ATGATAATTAGTTTTAATATCAGACTGTAA +Nuc. 
Counts: [12, 2, 4, 12] +Total Mass%: [42.57, 5.83, 15.87, 39.41] of 3809.4 +Codons List: [ATG, ATA, ATT, AGT, TTT, AAT, ATC, AGA, CTG, TAA] +Is Protein?: NO + +Region Name: jimi hendrix guitar talent protein +Nucleotides: ATGCAATTGCTCGATTAG +Nuc. Counts: [5, 3, 4, 6] +Total Mass%: [29.1, 14.35, 26.03, 32.33] of 2322.0 +Codons List: [ATG, CAA, TTG, CTC, GAT, TAG] +Is Protein?: YES + +Region Name: tyler durden's brain protein +Nucleotides: ATGATACCTATGAGTAATGTGGACCATATCCAAACTATAGGCATTGTCGGACCAACGATCGATTGGTTATACTGA +Nuc. Counts: [24, 14, 16, 21] +Total Mass%: [33.28, 15.96, 24.81, 26.96] of 9745.8 +Codons List: [ATG, ATA, CCT, ATG, AGT, AAT, GTG, GAC, CAT, ATC, CAA, ACT, ATA, GGC, ATT, GTC, GGA, CCA, ACG, ATC, GAT, TGG, TTA, TAC, TGA] +Is Protein?: YES + +Region Name: mini me growth hormone +Nucleotides: ATGGGACGCTGA +Nuc. Counts: [3, 2, 5, 2] +Total Mass%: [24.82, 13.6, 46.26, 15.32] of 1633.4 +Codons List: [ATG, GGA, CGC, TGA] +Is Protein?: NO + diff --git a/dna/output/ecoli.txt b/dna/output/ecoli.txt new file mode 100644 index 0000000..1c21d21 --- /dev/null +++ b/dna/output/ecoli.txt @@ -0,0 +1,140 @@ +Region Name: thr operon leader peptide +Nucleotides: ATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGA +Nuc. 
Counts: [21, 22, 12, 11] +Total Mass%: [32.9, 28.34, 21.02, 15.95] of 8625.7 +Codons List: [ATG, AAA, CGC, ATT, AGC, ACC, ACC, ATT, ACC, ACC, ACC, ATC, ACC, ATT, ACC, ACA, GGT, AAC, GGT, GCG, GGC, TGA] +Is Protein?: YES + +Region Name: aspartokinase I/homoserine dehydrogenase I +Nucleotides: ATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGGGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCATCTGGTAGCGATGATTGAAAAAACCATTAGCGGTCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTCTGACGGGACTCGCCGCCGCCCAGCCGGGATTTCCGCTGGCACAATTGAAAACTTTCGTCGACCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATCAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCATTATGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGGTCGAAAAACTGCTGGCAGTGGGTCATTACCTCGAATCTACCGTTGATATTGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCGGCTGACCACATGGTGCTGATGGCTGGTTTCACTGCCGGTAATGAAAAAGGCGAGCTGGTGGTTCTGGGACGCAACGGTTCCGACTACTCCGCTGCGGTGCTGGCGGCCTGTTTACGCGCCGATTGTTGCGAGATCTGGACGGATGTTGACGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGGAAGCGATGGAGCTTTCTTACTTCGGCGCTAAAGTTCTTCACCCCCGCACCATTACCCCCATCGCCCAGTTCCAGATCCCTTGCCTGATTAAAAATACCGGAAATCCCCAAGCACCAGGTACGCTCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATCTGAATAACATGGCAATGTTCAGCGTTTCCGGCCCGGGGATGAAAGGGATGGTTGGCATGGCGGCGCGCGTCTTTGCAGCGATGTCACGCGCCCGTATTTCCGTGGTGCTGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCAAAGCGACTGTGTGCGAGCTGAACGGGCAATGCAGGAAGAGTTCTACCTGGAACTGAAAGAAGGCTTACTGGAGCCGTTGGCGGTGACGGAACGGCTGGCCATTATCTCGGTGGTAGGTGATGGTATGCGCACCTTACGTGGGATCTCGGCGAAATTCTTTGCCGCGCTGGCCCGCGCCAATATCAACATTGTCGCCATTGCTCAGGGATCTTCTGAACGCTCAATCTCTGTCGTGGTCAATAACGATGATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGGCGTCGGTGGCGTTGGCGGTGCGCTGCTGGAGCAACTGAAGCGTCAGCAAAGCTGGTTGAAGAATAAACATATCGACTTACGTGTCTGCGGTGTTGCTAACTCGAAGGCACTGCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGGAAGAACTGGCGCAAGCCAAAGAGCCGTTTAATCTCGGGCGCTTAATTCGCCTCGTGAAAGAATATCATCTGCTGAACCCGGTCATTGTTGACTGTACTTCCAGCCAGGCTGTGGCAGATCAATATGCCGACTTCCTGCGC
GAAGGTTTCCACGTTGTTACGCCGAACAAAAAGGCCAACACCTCGTCGATGGATTACTACCATCAGTTGCGTTATGCGGCGGAAAAATCGCGGCGTAAATTCCTCTATGACACCAACGTTGGGGCTGGATTACCGGTTATTGAGAACCTGCAAAATCTGCTCAATGCTGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTATATCTTCGGCAAGTTAGACGAAGGCATGAGTTTCTCCGAGGCGACCACACTGGCGCGGGAAATGGGTTATACCGAACCGGACCCGCGAGATGATCTTTCTGGTATGGATGTGGCGCGTAAGCTATTGATTCTCGCTCGTGAAACGGGACGTGAACTGGAGCTGGCGGATATTGAAATTGAACCTGTGCTGCCCGCAGAGTTTAACGCCGAGGGTGATGTCGCCGCTTTTATGGCGAATCTGTCACAGCTCGACGATCTCTTTGCCGCGCGTGTGGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATATTGATGAAGATGGCGTCTGCCGCGTGAAGATTGCCGAAGTGGATGGTAATGATCCGCTGTTCAAAGTGAAAAATGGCGAAAACGCCCTGGCCTTCTATAGCCACTATTATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCAATGACGTTACAGCTGCCGGTGTCTTTGCTGATCTGCTACGTACCCTCTCATGGAAGTTAGGAGTCTGA +Nuc. Counts: [551, 608, 692, 612] +Total Mass%: [23.04, 20.91, 32.37, 23.7] of 323096.2 +Codons List: [ATG, CGA, GTG, TTG, AAG, TTC, GGC, GGT, ACA, TCA, GTG, GCA, AAT, GCA, GAA, CGT, TTT, CTG, CGG, GTT, GCC, GAT, ATT, CTG, GAA, AGC, AAT, GCC, AGG, CAG, GGG, CAG, GTG, GCC, ACC, GTC, CTC, TCT, GCC, CCC, GCC, AAA, ATC, ACC, AAC, CAT, CTG, GTA, GCG, ATG, ATT, GAA, AAA, ACC, ATT, AGC, GGT, CAG, GAT, GCT, TTA, CCC, AAT, ATC, AGC, GAT, GCC, GAA, CGT, ATT, TTT, GCC, GAA, CTT, CTG, ACG, GGA, CTC, GCC, GCC, GCC, CAG, CCG, GGA, TTT, CCG, CTG, GCA, CAA, TTG, AAA, ACT, TTC, GTC, GAC, CAG, GAA, TTT, GCC, CAA, ATA, AAA, CAT, GTC, CTG, CAT, GGC, ATC, AGT, TTG, TTG, GGG, CAG, TGC, CCG, GAT, AGC, ATC, AAC, GCT, GCG, CTG, ATT, TGC, CGT, GGC, GAG, AAA, ATG, TCG, ATC, GCC, ATT, ATG, GCC, GGC, GTG, TTA, GAA, GCG, CGT, GGT, CAC, AAC, GTT, ACC, GTT, ATC, GAT, CCG, GTC, GAA, AAA, CTG, CTG, GCA, GTG, GGT, CAT, TAC, CTC, GAA, TCT, ACC, GTT, GAT, ATT, GCT, GAA, TCC, ACC, CGC, CGT, ATT, GCG, GCA, AGC, CGC, ATT, CCG, GCT, GAC, CAC, ATG, GTG, CTG, ATG, GCT, GGT, TTC, ACT, GCC, GGT, AAT, GAA, AAA, GGC, GAG, CTG, GTG, GTT, CTG, GGA, CGC, AAC, GGT, TCC, GAC, TAC, TCC, GCT, GCG, GTG, CTG, GCG, GCC, TGT, TTA, CGC, GCC, GAT, TGT, TGC, GAG, ATC, TGG, ACG, 
GAT, GTT, GAC, GGT, GTT, TAT, ACC, TGC, GAT, CCG, CGT, CAG, GTG, CCC, GAT, GCG, AGG, TTG, TTG, AAG, TCG, ATG, TCC, TAT, CAG, GAA, GCG, ATG, GAG, CTT, TCT, TAC, TTC, GGC, GCT, AAA, GTT, CTT, CAC, CCC, CGC, ACC, ATT, ACC, CCC, ATC, GCC, CAG, TTC, CAG, ATC, CCT, TGC, CTG, ATT, AAA, AAT, ACC, GGA, AAT, CCC, CAA, GCA, CCA, GGT, ACG, CTC, ATT, GGT, GCC, AGC, CGT, GAT, GAA, GAC, GAA, TTA, CCG, GTC, AAG, GGC, ATT, TCC, AAT, CTG, AAT, AAC, ATG, GCA, ATG, TTC, AGC, GTT, TCC, GGC, CCG, GGG, ATG, AAA, GGG, ATG, GTT, GGC, ATG, GCG, GCG, CGC, GTC, TTT, GCA, GCG, ATG, TCA, CGC, GCC, CGT, ATT, TCC, GTG, GTG, CTG, ATT, ACG, CAA, TCA, TCT, TCC, GAA, TAC, AGT, ATC, AGT, TTC, TGC, GTT, CCG, CAA, AGC, GAC, TGT, GTG, CGA, GCT, GAA, CGG, GCA, ATG, CAG, GAA, GAG, TTC, TAC, CTG, GAA, CTG, AAA, GAA, GGC, TTA, CTG, GAG, CCG, TTG, GCG, GTG, ACG, GAA, CGG, CTG, GCC, ATT, ATC, TCG, GTG, GTA, GGT, GAT, GGT, ATG, CGC, ACC, TTA, CGT, GGG, ATC, TCG, GCG, AAA, TTC, TTT, GCC, GCG, CTG, GCC, CGC, GCC, AAT, ATC, AAC, ATT, GTC, GCC, ATT, GCT, CAG, GGA, TCT, TCT, GAA, CGC, TCA, ATC, TCT, GTC, GTG, GTC, AAT, AAC, GAT, GAT, GCG, ACC, ACT, GGC, GTG, CGC, GTT, ACT, CAT, CAG, ATG, CTG, TTC, AAT, ACC, GAT, CAG, GTT, ATC, GAA, GTG, TTT, GTG, ATT, GGC, GTC, GGT, GGC, GTT, GGC, GGT, GCG, CTG, CTG, GAG, CAA, CTG, AAG, CGT, CAG, CAA, AGC, TGG, TTG, AAG, AAT, AAA, CAT, ATC, GAC, TTA, CGT, GTC, TGC, GGT, GTT, GCT, AAC, TCG, AAG, GCA, CTG, CTC, ACC, AAT, GTA, CAT, GGC, CTT, AAT, CTG, GAA, AAC, TGG, CAG, GAA, GAA, CTG, GCG, CAA, GCC, AAA, GAG, CCG, TTT, AAT, CTC, GGG, CGC, TTA, ATT, CGC, CTC, GTG, AAA, GAA, TAT, CAT, CTG, CTG, AAC, CCG, GTC, ATT, GTT, GAC, TGT, ACT, TCC, AGC, CAG, GCT, GTG, GCA, GAT, CAA, TAT, GCC, GAC, TTC, CTG, CGC, GAA, GGT, TTC, CAC, GTT, GTT, ACG, CCG, AAC, AAA, AAG, GCC, AAC, ACC, TCG, TCG, ATG, GAT, TAC, TAC, CAT, CAG, TTG, CGT, TAT, GCG, GCG, GAA, AAA, TCG, CGG, CGT, AAA, TTC, CTC, TAT, GAC, ACC, AAC, GTT, GGG, GCT, GGA, TTA, CCG, GTT, ATT, GAG, AAC, CTG, CAA, AAT, CTG, CTC, AAT, GCT, GGT, GAT, 
GAA, TTG, ATG, AAG, TTC, TCC, GGC, ATT, CTT, TCA, GGT, TCG, CTT, TCT, TAT, ATC, TTC, GGC, AAG, TTA, GAC, GAA, GGC, ATG, AGT, TTC, TCC, GAG, GCG, ACC, ACA, CTG, GCG, CGG, GAA, ATG, GGT, TAT, ACC, GAA, CCG, GAC, CCG, CGA, GAT, GAT, CTT, TCT, GGT, ATG, GAT, GTG, GCG, CGT, AAG, CTA, TTG, ATT, CTC, GCT, CGT, GAA, ACG, GGA, CGT, GAA, CTG, GAG, CTG, GCG, GAT, ATT, GAA, ATT, GAA, CCT, GTG, CTG, CCC, GCA, GAG, TTT, AAC, GCC, GAG, GGT, GAT, GTC, GCC, GCT, TTT, ATG, GCG, AAT, CTG, TCA, CAG, CTC, GAC, GAT, CTC, TTT, GCC, GCG, CGT, GTG, GCG, AAG, GCC, CGT, GAT, GAA, GGA, AAA, GTT, TTG, CGC, TAT, GTT, GGC, AAT, ATT, GAT, GAA, GAT, GGC, GTC, TGC, CGC, GTG, AAG, ATT, GCC, GAA, GTG, GAT, GGT, AAT, GAT, CCG, CTG, TTC, AAA, GTG, AAA, AAT, GGC, GAA, AAC, GCC, CTG, GCC, TTC, TAT, AGC, CAC, TAT, TAT, CAG, CCG, CTG, CCG, TTG, GTA, CTG, CGC, GGA, TAT, GGT, GCG, GGC, AAT, GAC, GTT, ACA, GCT, GCC, GGT, GTC, TTT, GCT, GAT, CTG, CTA, CGT, ACC, CTC, TCA, TGG, AAG, TTA, GGA, GTC, TGA] +Is Protein?: YES + +Region Name: homoserine kinase +Nucleotides: ATGGTTAAAGTTTATGCCCCGGCTTCCAGTGCCAATATGAGCGTCGGGTTTGATGTGCTCGGGGCGGCGGTGACACCTGTTGATGGTGCATTGCTCGGAGATGTAGTCACGGTTGAGGCGGCAGAGACATTCAGTCTCAACAACCTCGGACGCTTTGCCGATAAGCTGCCGTCAGAGCCACGGGAAAATATCGTTTATCAGTGCTGGGAGCGTTTTTGCCAGGAGCTTGGCAAGCAAATTCCAGTGGCGATGACTCTGGAAAAGAATATGCCGATCGGTTCGGGCTTAGGCTCCAGCGCCTGTTCAGTGGTCGCGGCGCTGATGGCGATGAATGAACACTGCGGCAAGCCGCTTAATGACACTCGTTTGCTGGCTTTGATGGGCGAGTTGGAAGGGCGTATCTCCGGCAGCATTCATTACGACAACGTGGCACCGTGTTTTCTTGGTGGTATGCAGTTGATGATCGAAGAAAACGACATCATCAGCCAGCAAGTGCCAGGGTTTGATGAGTGGCTGTGGGTGCTGGCGTATCCGGGGATTAAAGTCTCGACGGCAGAAGCCAGGGCTATTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCACGGGCGACATCTGGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATGAAAGATGTTATCGCTGAACCCTACCGTGAACGGTTACTGCCAGGCTTCCGGCAGGCGCGGCAGGCGGTTGCGGAAATCGGCGCGGTAGCGAGCGGTATCTCCGGCTCCGGCCCGACTTTGTTCGCTCTGTGTGACAAGCCGGATACCGCCCAGCGCGTTGCCGACTGGTTGGGTAAGAACTACCTGCAAAATCAGGAAGGTTTTGTTCATATTTGCCGGCTGGATACGGCGGGCGCACGAGTACTGGAAAACTAA +Nuc. 
Counts: [193, 226, 295, 219] +Total Mass%: [21.16, 20.37, 36.17, 22.23] of 123268.3 +Codons List: [ATG, GTT, AAA, GTT, TAT, GCC, CCG, GCT, TCC, AGT, GCC, AAT, ATG, AGC, GTC, GGG, TTT, GAT, GTG, CTC, GGG, GCG, GCG, GTG, ACA, CCT, GTT, GAT, GGT, GCA, TTG, CTC, GGA, GAT, GTA, GTC, ACG, GTT, GAG, GCG, GCA, GAG, ACA, TTC, AGT, CTC, AAC, AAC, CTC, GGA, CGC, TTT, GCC, GAT, AAG, CTG, CCG, TCA, GAG, CCA, CGG, GAA, AAT, ATC, GTT, TAT, CAG, TGC, TGG, GAG, CGT, TTT, TGC, CAG, GAG, CTT, GGC, AAG, CAA, ATT, CCA, GTG, GCG, ATG, ACT, CTG, GAA, AAG, AAT, ATG, CCG, ATC, GGT, TCG, GGC, TTA, GGC, TCC, AGC, GCC, TGT, TCA, GTG, GTC, GCG, GCG, CTG, ATG, GCG, ATG, AAT, GAA, CAC, TGC, GGC, AAG, CCG, CTT, AAT, GAC, ACT, CGT, TTG, CTG, GCT, TTG, ATG, GGC, GAG, TTG, GAA, GGG, CGT, ATC, TCC, GGC, AGC, ATT, CAT, TAC, GAC, AAC, GTG, GCA, CCG, TGT, TTT, CTT, GGT, GGT, ATG, CAG, TTG, ATG, ATC, GAA, GAA, AAC, GAC, ATC, ATC, AGC, CAG, CAA, GTG, CCA, GGG, TTT, GAT, GAG, TGG, CTG, TGG, GTG, CTG, GCG, TAT, CCG, GGG, ATT, AAA, GTC, TCG, ACG, GCA, GAA, GCC, AGG, GCT, ATT, TTA, CCG, GCG, CAG, TAT, CGC, CGC, CAG, GAT, TGC, ATT, GCG, CAC, GGG, CGA, CAT, CTG, GCA, GGC, TTC, ATT, CAC, GCC, TGC, TAT, TCC, CGT, CAG, CTT, GAG, CTT, GCC, GCG, AAG, CTG, ATG, AAA, GAT, GTT, ATC, GCT, GAA, CCC, TAC, CGT, GAA, CGG, TTA, CTG, CCA, GGC, TTC, CGG, CAG, GCG, CGG, CAG, GCG, GTT, GCG, GAA, ATC, GGC, GCG, GTA, GCG, AGC, GGT, ATC, TCC, GGC, TCC, GGC, CCG, ACT, TTG, TTC, GCT, CTG, TGT, GAC, AAG, CCG, GAT, ACC, GCC, CAG, CGC, GTT, GCC, GAC, TGG, TTG, GGT, AAG, AAC, TAC, CTG, CAA, AAT, CAG, GAA, GGT, TTT, GTT, CAT, ATT, TGC, CGG, CTG, GAT, ACG, GCG, GGC, GCA, CGA, GTA, CTG, GAA, AAC, TAA] +Is Protein?: YES + +Region Name: threonine synthase +Nucleotides: 
ATGAAACTCTACAATCTGAAAGATCACAATGAGCAGGTCAGCTTTGCGCAAGCCGTAACCCAGGGGTTAGGCAAAAATCAGGGGCTGTTTTTTCCGCACGACCTGCCGGAATTCAGCCTGACTGAAATTGATGAGATGCTGAAGCTGGATTTTGTCACCCGCAGTGCGAAGATCCTCTCGGCGTTTATTGGTGATGAAATCCCGCAGGAAATCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAAGCGATGTCGGTTGTCTGGAATTGTTCCACGGGCCAACGCTGGCATTTAAAGATTTCGGCGGTCGCTTTATGGCACAAATGCTGACCCATATTGCGGGCGATAAGCCAGTGACCATTCTGACCGCGACATCCGGTGATACTGGAGCGGCAGTGGCTCATGCTTTCTACGGTTTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTGTTCTGTACATTGGGCGGCAATATCGAAACTGTTGCCATCGACGGCGATTTCGATGCCTGTCAGGCGCTGGTGAAGCAGGCGTTTGATGATGAAGAACTGAAAGTGGCGCTGGGGCTGAATTCTGCTAACTCCATCAACATCAGTCGCTTGCTGGCGCAGATTTGTTATTACTTTGAGGCTGTCGCACAGTTGCCGCAAGAAGCACGTAACCAGTTGGTTGTCTCGGTACCGAGTGGAAACTTCGGCGATTTGACGGCGGGTCTGCTGGCGAAGTCACTCGGTCTGCCGGTAAAACGTTTTATTGCTGCGACCAACGTGAACGATACCGTACCACGTTTCCTGCACGACGGTCAGTGGTCACCCAAAGCGACTCAGGCGACGTTATCCAATGCGATGGATGTTAGCCAGCCAAACAACTGGCCGCGTGTGGAAGAGTTGTTCCGCCGCAAAATCTGGCAACTGAAAGAGCTGGGTTATGCAGCCGTGGATGATGAAACCACGCAACAGACAATGCGTGAGTTAAAAGAACTGGGCTATACCTCGGAGCCGCACGCTGCCGTAGCTTATCGTGCGCTGCGTGACCAGTTGAATCCAGGCGAATATGGCTTGTTCCTCGGCACCGCGCATCCGGCGAAATTTAAAGAGAGCGTGGAAGCGATTCTCGGTGAAACGTTGGATCTGCCAAAAGAGCTGGCAGAACGTGCTGATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAATTGATGATGAATCATCAGTAA +Nuc. 
Counts: [309, 311, 358, 309] +Total Mass%: [24.69, 20.43, 32.0, 22.86] of 169097.5 +Codons List: [ATG, AAA, CTC, TAC, AAT, CTG, AAA, GAT, CAC, AAT, GAG, CAG, GTC, AGC, TTT, GCG, CAA, GCC, GTA, ACC, CAG, GGG, TTA, GGC, AAA, AAT, CAG, GGG, CTG, TTT, TTT, CCG, CAC, GAC, CTG, CCG, GAA, TTC, AGC, CTG, ACT, GAA, ATT, GAT, GAG, ATG, CTG, AAG, CTG, GAT, TTT, GTC, ACC, CGC, AGT, GCG, AAG, ATC, CTC, TCG, GCG, TTT, ATT, GGT, GAT, GAA, ATC, CCG, CAG, GAA, ATC, CTG, GAA, GAG, CGC, GTA, CGT, GCG, GCG, TTT, GCC, TTC, CCG, GCT, CCG, GTC, GCC, AAT, GTT, GAA, AGC, GAT, GTC, GGT, TGT, CTG, GAA, TTG, TTC, CAC, GGG, CCA, ACG, CTG, GCA, TTT, AAA, GAT, TTC, GGC, GGT, CGC, TTT, ATG, GCA, CAA, ATG, CTG, ACC, CAT, ATT, GCG, GGC, GAT, AAG, CCA, GTG, ACC, ATT, CTG, ACC, GCG, ACA, TCC, GGT, GAT, ACT, GGA, GCG, GCA, GTG, GCT, CAT, GCT, TTC, TAC, GGT, TTA, CCG, AAT, GTG, AAA, GTG, GTT, ATC, CTC, TAT, CCA, CGA, GGC, AAA, ATC, AGT, CCA, CTG, CAA, GAA, AAA, CTG, TTC, TGT, ACA, TTG, GGC, GGC, AAT, ATC, GAA, ACT, GTT, GCC, ATC, GAC, GGC, GAT, TTC, GAT, GCC, TGT, CAG, GCG, CTG, GTG, AAG, CAG, GCG, TTT, GAT, GAT, GAA, GAA, CTG, AAA, GTG, GCG, CTG, GGG, CTG, AAT, TCT, GCT, AAC, TCC, ATC, AAC, ATC, AGT, CGC, TTG, CTG, GCG, CAG, ATT, TGT, TAT, TAC, TTT, GAG, GCT, GTC, GCA, CAG, TTG, CCG, CAA, GAA, GCA, CGT, AAC, CAG, TTG, GTT, GTC, TCG, GTA, CCG, AGT, GGA, AAC, TTC, GGC, GAT, TTG, ACG, GCG, GGT, CTG, CTG, GCG, AAG, TCA, CTC, GGT, CTG, CCG, GTA, AAA, CGT, TTT, ATT, GCT, GCG, ACC, AAC, GTG, AAC, GAT, ACC, GTA, CCA, CGT, TTC, CTG, CAC, GAC, GGT, CAG, TGG, TCA, CCC, AAA, GCG, ACT, CAG, GCG, ACG, TTA, TCC, AAT, GCG, ATG, GAT, GTT, AGC, CAG, CCA, AAC, AAC, TGG, CCG, CGT, GTG, GAA, GAG, TTG, TTC, CGC, CGC, AAA, ATC, TGG, CAA, CTG, AAA, GAG, CTG, GGT, TAT, GCA, GCC, GTG, GAT, GAT, GAA, ACC, ACG, CAA, CAG, ACA, ATG, CGT, GAG, TTA, AAA, GAA, CTG, GGC, TAT, ACC, TCG, GAG, CCG, CAC, GCT, GCC, GTA, GCT, TAT, CGT, GCG, CTG, CGT, GAC, CAG, TTG, AAT, CCA, GGC, GAA, TAT, GGC, TTG, TTC, CTC, GGC, ACC, GCG, CAT, CCG, GCG, 
AAA, TTT, AAA, GAG, AGC, GTG, GAA, GCG, ATT, CTC, GGT, GAA, ACG, TTG, GAT, CTG, CCA, AAA, GAG, CTG, GCA, GAA, CGT, GCT, GAT, TTA, CCC, TTG, CTT, TCG, CAT, AAC, CTG, CCC, GCC, GAT, TTT, GCT, GCG, TTG, CGT, AAA, TTG, ATG, ATG, AAT, CAT, CAG, TAA] +Is Protein?: YES + +Region Name: hypothetical protein +Nucleotides: ATGCAGCCCGGCTTTTTTTATGAAGAAAATATGGAGAAAAACGACAGGGAAAAAGGAGAAATTCTCAATAAATGCGGTAACTTAGAGATTAGGATTGCGGAGAATAACAACTGCCGTTCTCATCGCGTAATCTCCGGATATCGACCCATAACGGGCAATGATAAAAGGAGTAACCTGTGA +Nuc. Counts: [66, 31, 43, 40] +Total Mass%: [37.57, 14.51, 27.37, 21.08] of 23739.3 +Codons List: [ATG, CAG, CCC, GGC, TTT, TTT, TAT, GAA, GAA, AAT, ATG, GAG, AAA, AAC, GAC, AGG, GAA, AAA, GGA, GAA, ATT, CTC, AAT, AAA, TGC, GGT, AAC, TTA, GAG, ATT, AGG, ATT, GCG, GAG, AAT, AAC, AAC, TGC, CGT, TCT, CAT, CGC, GTA, ATC, TCC, GGA, TAT, CGA, CCC, ATA, ACG, GGC, AAT, GAT, AAA, AGG, AGT, AAC, CTG, TGA] +Is Protein?: YES + +Region Name: Non-protein region +Nucleotides: AAAAACTGCTGGAAACAATGAAAGACGTACCGGACGACCAACGTCAGGCGC +Nuc. 
Counts: [20, 13, 13, 5] +Total Mass%: [39.46, 21.09, 28.68, 9.13] of 6849.2 +Codons List: [AAA, AAC, TGC, TGG, AAA, CAA, TGA, AAG, ACG, TAC, CGG, ACG, ACC, AAC, GTC, AGG, CGC] +Is Protein?: NO + +Region Name: transaldolase B +Nucleotides: ATGACGGACAAATTGACCTCCCTTCGTCAGTACACCACCGTAGTGGCCGACACTGGGGACATCGCGGCAATGAAGCTGTATCAACCGCAGGATGCCACAACCAACCCTTCTCTCATTCTTAACGCAGCGCAGATTCCGGAATACCGTAAGTTGATTGATGATGCTGTCGCCTGGGCGAAACAGCAGAGCAACGATCGCGCGCAGCAGATCGTGGACGCGACCGACAAACTGGCAGTAAATATTGGTCTGGAAATCCTGAAACTGGTTCCGGGCCGTATCTCAACTGAAGTTGATGCGCGTCTTTCCTATGACACCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGCAGGTATTAGCAACGATCGTATTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGCAGAACAGCTGGAAAAAGAAGGTATTAACTGTAACCTGACCCTGCTGTTCTCCTTCGCTCAGGCTCGTGCTTGTGCGGAAGCGGGCGTGTTCCTGATCTCGCCGTTTGTTGGCCGTATTCTTGACTGGTACAAAGCGAATACCGATAAGAAAGAGTACGCTCCGGCAGAAGATCCGGGCGTGGTTTCTGTATCTGAAATCTACCAGTACTACAAAGAGCATGGTTATGAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAACTGGCAGGCTGCGACCGTCTGACCATCGCACCGGCACTGCTGAAAGAGCTGGCGGAGAGCGAAGGGGCTATCGAACGTAAACTGTCTTACACTGGTGAAGTGAAAGCGCGTCCGGCGCGTATCACTGAGTCCGAGTTCCTGTGGCAGCACAACCAGGATCCAATGGCAGTAGATAAACTGGCGGAAGGTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCTGTAA +Nuc. 
Counts: [252, 236, 256, 210] +Total Mass%: [27.11, 20.88, 30.8, 20.92] of 125598.0 +Codons List: [ATG, ACG, GAC, AAA, TTG, ACC, TCC, CTT, CGT, CAG, TAC, ACC, ACC, GTA, GTG, GCC, GAC, ACT, GGG, GAC, ATC, GCG, GCA, ATG, AAG, CTG, TAT, CAA, CCG, CAG, GAT, GCC, ACA, ACC, AAC, CCT, TCT, CTC, ATT, CTT, AAC, GCA, GCG, CAG, ATT, CCG, GAA, TAC, CGT, AAG, TTG, ATT, GAT, GAT, GCT, GTC, GCC, TGG, GCG, AAA, CAG, CAG, AGC, AAC, GAT, CGC, GCG, CAG, CAG, ATC, GTG, GAC, GCG, ACC, GAC, AAA, CTG, GCA, GTA, AAT, ATT, GGT, CTG, GAA, ATC, CTG, AAA, CTG, GTT, CCG, GGC, CGT, ATC, TCA, ACT, GAA, GTT, GAT, GCG, CGT, CTT, TCC, TAT, GAC, ACC, GAA, GCG, TCA, ATT, GCG, AAA, GCA, AAA, CGC, CTG, ATC, AAA, CTC, TAC, AAC, GAT, GCA, GGT, ATT, AGC, AAC, GAT, CGT, ATT, CTG, ATC, AAA, CTG, GCT, TCT, ACC, TGG, CAG, GGT, ATC, CGT, GCT, GCA, GAA, CAG, CTG, GAA, AAA, GAA, GGT, ATT, AAC, TGT, AAC, CTG, ACC, CTG, CTG, TTC, TCC, TTC, GCT, CAG, GCT, CGT, GCT, TGT, GCG, GAA, GCG, GGC, GTG, TTC, CTG, ATC, TCG, CCG, TTT, GTT, GGC, CGT, ATT, CTT, GAC, TGG, TAC, AAA, GCG, AAT, ACC, GAT, AAG, AAA, GAG, TAC, GCT, CCG, GCA, GAA, GAT, CCG, GGC, GTG, GTT, TCT, GTA, TCT, GAA, ATC, TAC, CAG, TAC, TAC, AAA, GAG, CAT, GGT, TAT, GAA, ACC, GTG, GTT, ATG, GGC, GCA, AGC, TTC, CGT, AAC, ATC, GGC, GAA, ATT, CTG, GAA, CTG, GCA, GGC, TGC, GAC, CGT, CTG, ACC, ATC, GCA, CCG, GCA, CTG, CTG, AAA, GAG, CTG, GCG, GAG, AGC, GAA, GGG, GCT, ATC, GAA, CGT, AAA, CTG, TCT, TAC, ACT, GGT, GAA, GTG, AAA, GCG, CGT, CCG, GCG, CGT, ATC, ACT, GAG, TCC, GAG, TTC, CTG, TGG, CAG, CAC, AAC, CAG, GAT, CCA, ATG, GCA, GTA, GAT, AAA, CTG, GCG, GAA, GGT, ATC, CGT, AAG, TTT, GCT, GTT, GAC, CAG, GAA, AAA, CTG, GAA, AAA, ATG, ATC, GGC, GAT, CTG, CTG, TAA] +Is Protein?: YES + +Region Name: molybdopterin biosynthesis mog protein +Nucleotides: 
ATGAATACTTTACGTATTGGCTTAGTTTCCATCTCTGATCGCGCATCCAGCGGCGTTTATCAGGATAAAGGCATCCCTGCGCTGGAAGAATGGCTGACATCGGCGCTAACCACGCCGTTTGAACTGGAAACCCGCTTAATCCCCGATGAGCAGGCGATCATCGAGCAAACGTTGTGTGAGCTGGTGGATGAAATGAGTTGCCATCTGGTGCTCACCACGGGCGGAACTGGCCCTGCGCGTCGTGACGTAACGCCCGATGCGACGCTGGCAGTAGCGGACCGCGAGATGCCAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACCAACTGCGATCCTTTCGCGTCAGGTGGGGGTGATTCGCAAACAGGCGCTGATCCTTAACTTACCCGGTCAACCGAAGTCTATTAAAGAGACGCTGGAAGGTGTGAAGGACGCTGAGGGTAACGTTGTGGTGCACGGTATTTTTGCCAGCGTACCGTACTGCATTCAGTTGCTGGAAGGGCCATACGTTGAAACGGCACCGGAAGTGGTTGCAGCATTCAGACCGAAGAGTGCAAGACGCGAAGTTAGCGAATAA +Nuc. Counts: [139, 143, 175, 131] +Total Mass%: [24.18, 20.45, 34.05, 21.1] of 77675.0 +Codons List: [ATG, AAT, ACT, TTA, CGT, ATT, GGC, TTA, GTT, TCC, ATC, TCT, GAT, CGC, GCA, TCC, AGC, GGC, GTT, TAT, CAG, GAT, AAA, GGC, ATC, CCT, GCG, CTG, GAA, GAA, TGG, CTG, ACA, TCG, GCG, CTA, ACC, ACG, CCG, TTT, GAA, CTG, GAA, ACC, CGC, TTA, ATC, CCC, GAT, GAG, CAG, GCG, ATC, ATC, GAG, CAA, ACG, TTG, TGT, GAG, CTG, GTG, GAT, GAA, ATG, AGT, TGC, CAT, CTG, GTG, CTC, ACC, ACG, GGC, GGA, ACT, GGC, CCT, GCG, CGT, CGT, GAC, GTA, ACG, CCC, GAT, GCG, ACG, CTG, GCA, GTA, GCG, GAC, CGC, GAG, ATG, CCA, GGC, TTT, GGT, GAA, CAG, ATG, CGC, CAG, ATC, AGC, CTG, CAT, TTT, GTA, CCA, ACT, GCG, ATC, CTT, TCG, CGT, CAG, GTG, GGG, GTG, ATT, CGC, AAA, CAG, GCG, CTG, ATC, CTT, AAC, TTA, CCC, GGT, CAA, CCG, AAG, TCT, ATT, AAA, GAG, ACG, CTG, GAA, GGT, GTG, AAG, GAC, GCT, GAG, GGT, AAC, GTT, GTG, GTG, CAC, GGT, ATT, TTT, GCC, AGC, GTA, CCG, TAC, TGC, ATT, CAG, TTG, CTG, GAA, GGG, CCA, TAC, GTT, GAA, ACG, GCA, CCG, GAA, GTG, GTT, GCA, GCA, TTC, AGA, CCG, AAG, AGT, GCA, AGA, CGC, GAA, GTT, AGC, GAA, TAA] +Is Protein?: YES + +Region Name: chaperone protein DnaK +Nucleotides: 
ATGGGTAAAATAATTGGTATCGACCTGGGTACTACCAACTCTTGTGTAGCGATTATGGATGGCACCACTCCTCGTGTACTGGAGAACGCCGAAGGCGATCGCACCACGCCTTCTATCATTGCCTATACCCAGGATGGTGAAACTCTGGTTGGTCAGCCGGCTAAACGTCAGGCAGTGACGAACCCGCAAAACACCCTGTTTGCGATTAAACGCCTGATTGGCCGCCGCTTCCAGGACGAAGAAGTACAGCGTGATGTTTCCATCATGCCGTTCAAAATTATTGCTGCTGATAACGGCGACGCATGGGTCGAAGTTAAAGGCCAGAAAATGGCACCGCCGCAGATCTCTGCTGAAGTGCTGAAAAAAATGAAGAAAACCGCTGAAGATTACCTGGGTGAACCGGTAACTGAAGCTGTTATTACCGTACCGGCATACTTTAACGATGCTCAGCGTCAGGCAACCAAAGACGCAGGCCGTATCGCTGGTCTGGAAGTAAAACGTATCATCAACGAACCGACCGCAGCTGCGCTGGCTTACGGTCTGGACAAAGGTACTGGCAACCGTACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTCCATTATCGAAATCGACGAAGTTGACGGCGAAAAAACCTTCGAAGTTCTGGCAACCAACGGTGATACCCACCTGGGTGGTGAAGACTTCGACAGTCGTCTGATCAACTATCTGGTTGAAGAATTCAAGAAAGATCAGGGCATTGACCTGCGCAACGATCCGCTGGCAATGCAGCGCCTGAAAGAAGCGGCAGAAAAAGCGAAAATCGAACTGTCTTCCGCTCAGCAGACCGACGTTAACCTGCCGTACATCACTGCAGACGCGACCGGTCCGAAACACATGAACATCAAAGTGACTCGTGCGAAACTGGAAAGCCTGGTTGAAGATCTGGTAAACCGTTCCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATATCGACGACGTTATTCTCGTTGGTGGTCAGACTCGTATGCCAATGGTTCAGAAGAAAGTTGCTGAATTCTTTGGTAAAGAGCCGCGTAAAGATGTTAACCCGGACGAAGCTGTAGCCATCGGTGCTGCTGTTCAGGGTGGTGTTCTGACTGGTGACGTAAAAGACGTACTGCTGCTGGACGTTACCCCGCTGTCTCTGGGTATCGAAACCATGGGCGGTGTGATGACCACGCTGATCGCGAAAAACACCACTATCCCGACCAAGCACAGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATCCATGTGCTGCAGGGTGAACGTAAACGTGCGGCTGATAACAAATCTCTGGGTCAGTTCAACCTGGATGGTATCAACCCGGCACCGCGCGGCATGCCGCAGATCGAAGTTACCTTCGATATCGATGCTGACGGTATCCTGCACGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCACTATCAAGGCTTCTTCTGGTCTGAACGAAGATGAAATCCAGAAAATGGTACGCGACGCAGAAGCTAACGCCGAAGCTGACCGTAAGTTTGAAGAGCTGGTACAGACTCGCAACCAGGGCGACCATCTGCTGCACAGCACCCGTAAGCAGGTTGAAGAAGCAGGCGACAAACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGACTGCACTGGAAACTGCTCTGAAAGGTGAAGACAAAGCCGCTATCGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCAGCAGCAACATGCCCAGCAGCAGACTGCCGGTGCTGATGCTTCTGCAAACAACGCGAAAGATGACGATGTTGTCGACGCTGAATTTGAAGAAGTCAAAGACAAAAAATAA +Nuc. 
Counts: [541, 475, 504, 397] +Total Mass%: [28.92, 20.88, 30.13, 19.65] of 252806.4 +Codons List: [ATG, GGT, AAA, ATA, ATT, GGT, ATC, GAC, CTG, GGT, ACT, ACC, AAC, TCT, TGT, GTA, GCG, ATT, ATG, GAT, GGC, ACC, ACT, CCT, CGT, GTA, CTG, GAG, AAC, GCC, GAA, GGC, GAT, CGC, ACC, ACG, CCT, TCT, ATC, ATT, GCC, TAT, ACC, CAG, GAT, GGT, GAA, ACT, CTG, GTT, GGT, CAG, CCG, GCT, AAA, CGT, CAG, GCA, GTG, ACG, AAC, CCG, CAA, AAC, ACC, CTG, TTT, GCG, ATT, AAA, CGC, CTG, ATT, GGC, CGC, CGC, TTC, CAG, GAC, GAA, GAA, GTA, CAG, CGT, GAT, GTT, TCC, ATC, ATG, CCG, TTC, AAA, ATT, ATT, GCT, GCT, GAT, AAC, GGC, GAC, GCA, TGG, GTC, GAA, GTT, AAA, GGC, CAG, AAA, ATG, GCA, CCG, CCG, CAG, ATC, TCT, GCT, GAA, GTG, CTG, AAA, AAA, ATG, AAG, AAA, ACC, GCT, GAA, GAT, TAC, CTG, GGT, GAA, CCG, GTA, ACT, GAA, GCT, GTT, ATT, ACC, GTA, CCG, GCA, TAC, TTT, AAC, GAT, GCT, CAG, CGT, CAG, GCA, ACC, AAA, GAC, GCA, GGC, CGT, ATC, GCT, GGT, CTG, GAA, GTA, AAA, CGT, ATC, ATC, AAC, GAA, CCG, ACC, GCA, GCT, GCG, CTG, GCT, TAC, GGT, CTG, GAC, AAA, GGT, ACT, GGC, AAC, CGT, ACT, ATC, GCG, GTT, TAT, GAC, CTG, GGT, GGT, GGT, ACT, TTC, GAT, ATT, TCC, ATT, ATC, GAA, ATC, GAC, GAA, GTT, GAC, GGC, GAA, AAA, ACC, TTC, GAA, GTT, CTG, GCA, ACC, AAC, GGT, GAT, ACC, CAC, CTG, GGT, GGT, GAA, GAC, TTC, GAC, AGT, CGT, CTG, ATC, AAC, TAT, CTG, GTT, GAA, GAA, TTC, AAG, AAA, GAT, CAG, GGC, ATT, GAC, CTG, CGC, AAC, GAT, CCG, CTG, GCA, ATG, CAG, CGC, CTG, AAA, GAA, GCG, GCA, GAA, AAA, GCG, AAA, ATC, GAA, CTG, TCT, TCC, GCT, CAG, CAG, ACC, GAC, GTT, AAC, CTG, CCG, TAC, ATC, ACT, GCA, GAC, GCG, ACC, GGT, CCG, AAA, CAC, ATG, AAC, ATC, AAA, GTG, ACT, CGT, GCG, AAA, CTG, GAA, AGC, CTG, GTT, GAA, GAT, CTG, GTA, AAC, CGT, TCC, ATT, GAG, CCG, CTG, AAA, GTT, GCA, CTG, CAG, GAC, GCT, GGC, CTG, TCC, GTA, TCT, GAT, ATC, GAC, GAC, GTT, ATT, CTC, GTT, GGT, GGT, CAG, ACT, CGT, ATG, CCA, ATG, GTT, CAG, AAG, AAA, GTT, GCT, GAA, TTC, TTT, GGT, AAA, GAG, CCG, CGT, AAA, GAT, GTT, AAC, CCG, GAC, GAA, GCT, GTA, GCC, ATC, GGT, GCT, GCT, GTT, CAG, GGT, GGT, 
GTT, CTG, ACT, GGT, GAC, GTA, AAA, GAC, GTA, CTG, CTG, CTG, GAC, GTT, ACC, CCG, CTG, TCT, CTG, GGT, ATC, GAA, ACC, ATG, GGC, GGT, GTG, ATG, ACC, ACG, CTG, ATC, GCG, AAA, AAC, ACC, ACT, ATC, CCG, ACC, AAG, CAC, AGC, CAG, GTG, TTC, TCT, ACC, GCT, GAA, GAC, AAC, CAG, TCT, GCG, GTA, ACC, ATC, CAT, GTG, CTG, CAG, GGT, GAA, CGT, AAA, CGT, GCG, GCT, GAT, AAC, AAA, TCT, CTG, GGT, CAG, TTC, AAC, CTG, GAT, GGT, ATC, AAC, CCG, GCA, CCG, CGC, GGC, ATG, CCG, CAG, ATC, GAA, GTT, ACC, TTC, GAT, ATC, GAT, GCT, GAC, GGT, ATC, CTG, CAC, GTT, TCC, GCG, AAA, GAC, AAA, AAC, AGC, GGT, AAA, GAG, CAG, AAG, ATC, ACT, ATC, AAG, GCT, TCT, TCT, GGT, CTG, AAC, GAA, GAT, GAA, ATC, CAG, AAA, ATG, GTA, CGC, GAC, GCA, GAA, GCT, AAC, GCC, GAA, GCT, GAC, CGT, AAG, TTT, GAA, GAG, CTG, GTA, CAG, ACT, CGC, AAC, CAG, GGC, GAC, CAT, CTG, CTG, CAC, AGC, ACC, CGT, AAG, CAG, GTT, GAA, GAA, GCA, GGC, GAC, AAA, CTG, CCG, GCT, GAC, GAC, AAA, ACT, GCT, ATC, GAG, TCT, GCG, CTG, ACT, GCA, CTG, GAA, ACT, GCT, CTG, AAA, GGT, GAA, GAC, AAA, GCC, GCT, ATC, GAA, GCG, AAA, ATG, CAG, GAA, CTG, GCA, CAG, GTT, TCC, CAG, AAA, CTG, ATG, GAA, ATC, GCC, CAG, CAG, CAA, CAT, GCC, CAG, CAG, CAG, ACT, GCC, GGT, GCT, GAT, GCT, TCT, GCA, AAC, AAC, GCG, AAA, GAT, GAC, GAT, GTT, GTC, GAC, GCT, GAA, TTT, GAA, GAA, GTC, AAA, GAC, AAA, AAA, TAA] +Is Protein?: YES + +Region Name: chaperone protein DnaJ +Nucleotides: 
GTGCATTCATCTAGGGGCAATTTAAAAAAGATGGCTAAGCAAGATTATTACGAGATTTTAGGCGTTTCCAAAACAGCGGAAGAGCGTGAAATCAAAAAGGCCTACAAACGCCTGGCCATGAAATACCACCCGGACCGTAACCAGGGTGACAAAGAGGCCGAGGCGAAATTTAAAGAGATCAAGGAAGCTTATGAAGTTCTGACCGACTCGCAAAAACGTGCGGCATACGATCAGTATGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGCGGTTTTGGCGGCGGCGCAGACTTCAGCGATATTTTTGGTGACGTTTTCGGCGATATTTTTGGCGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTACGCTATAACATGGAGCTCACCCTCGAAGAAGCTGTACGTGGCGTGACCAAAGAGATCCGCATTCCGACTCTGGAAGAGTGTGACGTTTGCCACGGTAGCGGTGCAAAACCAGGTACACAGCCGCAGACCTGTCCGACCTGTCATGGTTCTGGCCAGGTGCAGATGCGCCAGGGTTTCTTTGCCGTGCAGCAGACCTGTCCACACTGTCAGGGCCGCGGTACGCTGATCAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGTTGAGCGCAGCAAAACGCTGTCCGTTAAAATCCCGGCAGGGGTGGACACTGGAGACCGCATCCGTCTTGCGGGCGAAGGTGAAGCGGGTGAACACGGCGCACCGGCAGGCGATCTGTACGTTCAGGTTCAGGTTAAACAGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGCGAAGTCCCGATCAACTTCGCTATGGCGGCGCTGGGTGGTGAAATCGAAGTACCGACCCTTGATGGTCGCGTCAAACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAGCTGTTCCGTATGCGCGGTAAAGGCGTCAAGTCTGTCCGCGGTGGCGCACAGGGTGATTTGCTATGCCGCGTTGTTGTCGAAACACCGGTAGGTTTGAACGAGAAGCAGAAACAGCTGCTGCAAGAGCTGCAAGAAAGCTTTGGTGGCCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCTTCTTTGATGGCGTGAAGAAGTTTTTTGACGACCTGACTCGCTAA +Nuc. 
Counts: [287, 278, 352, 244] +Total Mass%: [25.2, 20.07, 34.57, 19.84] of 153867.6 +Codons List: [GTG, CAT, TCA, TCT, AGG, GGC, AAT, TTA, AAA, AAG, ATG, GCT, AAG, CAA, GAT, TAT, TAC, GAG, ATT, TTA, GGC, GTT, TCC, AAA, ACA, GCG, GAA, GAG, CGT, GAA, ATC, AAA, AAG, GCC, TAC, AAA, CGC, CTG, GCC, ATG, AAA, TAC, CAC, CCG, GAC, CGT, AAC, CAG, GGT, GAC, AAA, GAG, GCC, GAG, GCG, AAA, TTT, AAA, GAG, ATC, AAG, GAA, GCT, TAT, GAA, GTT, CTG, ACC, GAC, TCG, CAA, AAA, CGT, GCG, GCA, TAC, GAT, CAG, TAT, GGT, CAT, GCT, GCG, TTT, GAG, CAA, GGT, GGC, ATG, GGC, GGC, GGC, GGT, TTT, GGC, GGC, GGC, GCA, GAC, TTC, AGC, GAT, ATT, TTT, GGT, GAC, GTT, TTC, GGC, GAT, ATT, TTT, GGC, GGC, GGA, CGT, GGT, CGT, CAA, CGT, GCG, GCG, CGC, GGT, GCT, GAT, TTA, CGC, TAT, AAC, ATG, GAG, CTC, ACC, CTC, GAA, GAA, GCT, GTA, CGT, GGC, GTG, ACC, AAA, GAG, ATC, CGC, ATT, CCG, ACT, CTG, GAA, GAG, TGT, GAC, GTT, TGC, CAC, GGT, AGC, GGT, GCA, AAA, CCA, GGT, ACA, CAG, CCG, CAG, ACC, TGT, CCG, ACC, TGT, CAT, GGT, TCT, GGC, CAG, GTG, CAG, ATG, CGC, CAG, GGT, TTC, TTT, GCC, GTG, CAG, CAG, ACC, TGT, CCA, CAC, TGT, CAG, GGC, CGC, GGT, ACG, CTG, ATC, AAA, GAT, CCG, TGC, AAC, AAA, TGT, CAT, GGT, CAT, GGT, CGT, GTT, GAG, CGC, AGC, AAA, ACG, CTG, TCC, GTT, AAA, ATC, CCG, GCA, GGG, GTG, GAC, ACT, GGA, GAC, CGC, ATC, CGT, CTT, GCG, GGC, GAA, GGT, GAA, GCG, GGT, GAA, CAC, GGC, GCA, CCG, GCA, GGC, GAT, CTG, TAC, GTT, CAG, GTT, CAG, GTT, AAA, CAG, CAC, CCG, ATT, TTC, GAG, CGT, GAA, GGC, AAC, AAC, CTG, TAT, TGC, GAA, GTC, CCG, ATC, AAC, TTC, GCT, ATG, GCG, GCG, CTG, GGT, GGT, GAA, ATC, GAA, GTA, CCG, ACC, CTT, GAT, GGT, CGC, GTC, AAA, CTG, AAA, GTG, CCT, GGC, GAA, ACC, CAG, ACC, GGT, AAG, CTG, TTC, CGT, ATG, CGC, GGT, AAA, GGC, GTC, AAG, TCT, GTC, CGC, GGT, GGC, GCA, CAG, GGT, GAT, TTG, CTA, TGC, CGC, GTT, GTT, GTC, GAA, ACA, CCG, GTA, GGT, TTG, AAC, GAG, AAG, CAG, AAA, CAG, CTG, CTG, CAA, GAG, CTG, CAA, GAA, AGC, TTT, GGT, GGC, CCA, ACC, GGC, GAG, CAC, AAC, AGC, CCG, CGT, TCA, AAG, AGC, TTC, TTT, GAT, GGC, GTG, AAG, AAG, TTT, 
TTT, GAC, GAC, CTG, ACT, CGC, TAA] +Is Protein?: NO + +Region Name: hypothetical protein +Nucleotides: TTGCTCTTACTCGGATTCGTAAGCCGTGAAAACAGCAACCTCCGTCTGGCCAGTTCGGATGTGAACCTCACAGAGGTCTTTTCTCGTTACCAGCGCCGCCACTACGGCGGTGATACAGATGACGATCAGGGCGACAATCATCGCCTTATGCTGCTTCATTGCTCTCTTCTCCTTGACCTTTCGGTCAGTAAGAGGCACTCTACATGTGTTCTGCATATAGGGGGCCTCGGGTTGATGGTAAAATATCACTCGGGGCTTTTCTCTATCTGCCGTTCAGCTAATGCCTGA +Nuc. Counts: [58, 78, 69, 83] +Total Mass%: [21.04, 23.27, 28.0, 27.88] of 37245.0 +Codons List: [TTG, CTC, TTA, CTC, GGA, TTC, GTA, AGC, CGT, GAA, AAC, AGC, AAC, CTC, CGT, CTG, GCC, AGT, TCG, GAT, GTG, AAC, CTC, ACA, GAG, GTC, TTT, TCT, CGT, TAC, CAG, CGC, CGC, CAC, TAC, GGC, GGT, GAT, ACA, GAT, GAC, GAT, CAG, GGC, GAC, AAT, CAT, CGC, CTT, ATG, CTG, CTT, CAT, TGC, TCT, CTT, CTC, CTT, GAC, CTT, TCG, GTC, AGT, AAG, AGG, CAC, TCT, ACA, TGT, GTT, CTG, CAT, ATA, GGG, GGC, CTC, GGG, TTG, ATG, GTA, AAA, TAT, CAC, TCG, GGG, CTT, TTC, TCT, ATC, TGC, CGT, TCA, GCT, AAT, GCC, TGA] +Is Protein?: NO + +Region Name: hypothetical protein +Nucleotides: ATGTCTGCCAAAAGACGACTTCTTATTGCGTGTACCTTGATAACAGCTATCTATCATTTTCCTGCATATTCTTCATTAGAATATAAAGGATCCTTTGGTTCAATAAATGCGGGTTATGCAGACTGGAATAGTGGATTTGTAAACACTCACCGTGGTGAAGTATGGAAAGTGACTGCGGATTTTGGGGTAAATTTTAAAGAAGCAGAATTTTACTCATTTTATGAAAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACGGTTTCAGCAATGACGCATGTCAGACTCTTTGACTCTGATATGACATTCTTTGGCAAAATTTATGGCCAATGGGATAACTCATGGGGTGACGATCTGGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCGAGTGGGGCTTTTTTAAACCGTATATTGGATTGCATAATCAATCTGGTGACTACGTATCAGCTAAATATGGTCAAACGAATGGTTGGAATGGTTATGTTGTTGGCTGGACAGCAGTATTACCATTTACGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGAAATAGAACTGGACAGGAACGATGCTTACACGGAGCAGCAATTTGGCCGGAACGGGTTAAATGGCGGTTTAACTATTGCCTGGAAGTTCTATCCTCGCTGGAAAGCCAGTGTGACGTGGCGTTATTTCGATAATAAGCTGGGCTACGATGGCTTTGGCGATCAAATGATTTATATGCTTGGTTATGATTTCTAA +Nuc. 
Counts: [214, 121, 184, 243] +Total Mass%: [29.25, 13.6, 28.13, 30.75] of 98860.9 +Codons List: [ATG, TCT, GCC, AAA, AGA, CGA, CTT, CTT, ATT, GCG, TGT, ACC, TTG, ATA, ACA, GCT, ATC, TAT, CAT, TTT, CCT, GCA, TAT, TCT, TCA, TTA, GAA, TAT, AAA, GGA, TCC, TTT, GGT, TCA, ATA, AAT, GCG, GGT, TAT, GCA, GAC, TGG, AAT, AGT, GGA, TTT, GTA, AAC, ACT, CAC, CGT, GGT, GAA, GTA, TGG, AAA, GTG, ACT, GCG, GAT, TTT, GGG, GTA, AAT, TTT, AAA, GAA, GCA, GAA, TTT, TAC, TCA, TTT, TAT, GAA, AGT, AAT, GTA, CTC, AAT, CAT, GCT, GTA, GCA, GGG, AGA, AAT, CAT, ACG, GTT, TCA, GCA, ATG, ACG, CAT, GTC, AGA, CTC, TTT, GAC, TCT, GAT, ATG, ACA, TTC, TTT, GGC, AAA, ATT, TAT, GGC, CAA, TGG, GAT, AAC, TCA, TGG, GGT, GAC, GAT, CTG, GAC, ATG, TTT, TAT, GGA, TTC, GGT, TAC, CTC, GGC, TGG, AAC, GGC, GAG, TGG, GGC, TTT, TTT, AAA, CCG, TAT, ATT, GGA, TTG, CAT, AAT, CAA, TCT, GGT, GAC, TAC, GTA, TCA, GCT, AAA, TAT, GGT, CAA, ACG, AAT, GGT, TGG, AAT, GGT, TAT, GTT, GTT, GGC, TGG, ACA, GCA, GTA, TTA, CCA, TTT, ACG, TTA, TTT, GAC, GAA, AAA, TTT, GTT, TTA, TCT, AAC, TGG, AAT, GAA, ATA, GAA, CTG, GAC, AGG, AAC, GAT, GCT, TAC, ACG, GAG, CAG, CAA, TTT, GGC, CGG, AAC, GGG, TTA, AAT, GGC, GGT, TTA, ACT, ATT, GCC, TGG, AAG, TTC, TAT, CCT, CGC, TGG, AAA, GCC, AGT, GTG, ACG, TGG, CGT, TAT, TTC, GAT, AAT, AAG, CTG, GGC, TAC, GAT, GGC, TTT, GGC, GAT, CAA, ATG, ATT, TAT, ATG, CTT, GGT, TAT, GAT, TTC, TAA] +Is Protein?: YES + +Region Name: putative secreted sulfatase +Nucleotides: 
ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAATGCTTTTAGTCCTGCCTTAGCCGCAGAGGCTAAACAACCTAATTTAGTCATTATTATGGCGGATGATTTAGGTTATGGCGATTTAGCAACATATGGTCATCAGATCGTTAAAACACCTAATATCGACAGGCTTGCCCAGGAAGGGGTCAAATTTACTGACTACTATGCCCCCGCTCCTTTAAGTTCACCTTCACGCGCAGGGCTATTAACCGGCCGGATGCCATTTCGTACTGGAATTCGCTCATGGATTCCTTCAGGCAAAGATGTTGCCTTAGGGCGTAACGAACTCACGATTGCTAATCTACTCAAAGCGCAAGGGTACGACACGGCAATGATGGGTAAGCTGCATCTGAATGCAGGCGGCGATCGCACCGATCAGCCACAAGCACAAGATATGGGCTTTGATTACTCACTGGTTAATACGGCGGGCTTTGTTACCGACGCCACGCTGGATAACGCTAAAGAACGCCCGCGTTATGGCATGGTTTACCCGACAGGCTGGCTACGTAACGGGCAACCCACTCCACGAGCTGATAAAATGAGCGGTGAGTATGTCAGTTCGGAAGTCGTCAACTGGCTGGATAACAAAAAGGACAGCAAGCCTTTCTTCCTCTATGTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAAAATACCTCGATATGTACTCACAATATATGAGCGCGTATCAGAAGCAGCATCCTGATTTATTTTATGGCGACTGGGCAGACAAACCCTGGCGTGGTGTGGGGGAATATTATGCCAATATCAGCTATCTGGATGCACAGGTTGGAAAAGTGCTGGATAAAATCAAAGCTGTGGGTGAAGAAGATAACACAATCGTTATTTTTACCAGTGATAACGGTCCGGTAACGCGTGAAGCGCGCAAAGTGTATGAGCTGAATTTGGCAGGGGAAACGGATGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGTGTTCCAGCCATTATTAAATATGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGTCTGGACTGGATGCCTACTTTAGCGAAAATGATGAACTTCAAATTACCTACAGACCGTACTTTCGATGGTGAATCGCTGGTTCCTGTTCTTGAGCAAAAAGCATTGAAACGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATGATCCAACCGATGAATGGGCGATCCGTGATGGTGACTGGAAGATGATTATCGATCGCAATAATAAACCGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAACACTTAATCTGATCGGTAAAAAAACAGATATTGAAAAACAGATGTATGGTAAGTTTTTAAAATATAAAACTGATATTGATAATGATTCTCTAATGAAAGCCAGAGGTGATAAACCAGAAGCGGTGACCTGGGGCTAA +Nuc. 
Counts: [440, 312, 362, 380] +Total Mass%: [30.43, 17.74, 28.0, 24.33] of 195417.1 +Codons List: [ATG, CAG, AAA, ACG, TTA, ATG, GCC, AGT, TTG, ATC, GGC, CTT, GCA, GTT, TGC, ACA, GGG, AAT, GCT, TTT, AGT, CCT, GCC, TTA, GCC, GCA, GAG, GCT, AAA, CAA, CCT, AAT, TTA, GTC, ATT, ATT, ATG, GCG, GAT, GAT, TTA, GGT, TAT, GGC, GAT, TTA, GCA, ACA, TAT, GGT, CAT, CAG, ATC, GTT, AAA, ACA, CCT, AAT, ATC, GAC, AGG, CTT, GCC, CAG, GAA, GGG, GTC, AAA, TTT, ACT, GAC, TAC, TAT, GCC, CCC, GCT, CCT, TTA, AGT, TCA, CCT, TCA, CGC, GCA, GGG, CTA, TTA, ACC, GGC, CGG, ATG, CCA, TTT, CGT, ACT, GGA, ATT, CGC, TCA, TGG, ATT, CCT, TCA, GGC, AAA, GAT, GTT, GCC, TTA, GGG, CGT, AAC, GAA, CTC, ACG, ATT, GCT, AAT, CTA, CTC, AAA, GCG, CAA, GGG, TAC, GAC, ACG, GCA, ATG, ATG, GGT, AAG, CTG, CAT, CTG, AAT, GCA, GGC, GGC, GAT, CGC, ACC, GAT, CAG, CCA, CAA, GCA, CAA, GAT, ATG, GGC, TTT, GAT, TAC, TCA, CTG, GTT, AAT, ACG, GCG, GGC, TTT, GTT, ACC, GAC, GCC, ACG, CTG, GAT, AAC, GCT, AAA, GAA, CGC, CCG, CGT, TAT, GGC, ATG, GTT, TAC, CCG, ACA, GGC, TGG, CTA, CGT, AAC, GGG, CAA, CCC, ACT, CCA, CGA, GCT, GAT, AAA, ATG, AGC, GGT, GAG, TAT, GTC, AGT, TCG, GAA, GTC, GTC, AAC, TGG, CTG, GAT, AAC, AAA, AAG, GAC, AGC, AAG, CCT, TTC, TTC, CTC, TAT, GTT, GCT, TTT, ACC, GAA, GTG, CAT, AGC, CCC, CTG, GCT, TCG, CCC, AAA, AAA, TAC, CTC, GAT, ATG, TAC, TCA, CAA, TAT, ATG, AGC, GCG, TAT, CAG, AAG, CAG, CAT, CCT, GAT, TTA, TTT, TAT, GGC, GAC, TGG, GCA, GAC, AAA, CCC, TGG, CGT, GGT, GTG, GGG, GAA, TAT, TAT, GCC, AAT, ATC, AGC, TAT, CTG, GAT, GCA, CAG, GTT, GGA, AAA, GTG, CTG, GAT, AAA, ATC, AAA, GCT, GTG, GGT, GAA, GAA, GAT, AAC, ACA, ATC, GTT, ATT, TTT, ACC, AGT, GAT, AAC, GGT, CCG, GTA, ACG, CGT, GAA, GCG, CGC, AAA, GTG, TAT, GAG, CTG, AAT, TTG, GCA, GGG, GAA, ACG, GAT, GGA, TTA, CGC, GGT, CGC, AAG, GAT, AAC, CTT, TGG, GAA, GGC, GGA, ATT, CGT, GTT, CCA, GCC, ATT, ATT, AAA, TAT, GGT, AAA, CAT, CTA, CCA, CAG, GGA, ATG, GTT, TCA, GAT, ACA, CCC, GTT, TAT, GGT, CTG, GAC, TGG, ATG, CCT, ACT, TTA, GCG, AAA, ATG, ATG, AAC, TTC, AAA, 
TTA, CCT, ACA, GAC, CGT, ACT, TTC, GAT, GGT, GAA, TCG, CTG, GTT, CCT, GTT, CTT, GAG, CAA, AAA, GCA, TTG, AAA, CGC, GAA, AAG, CCA, TTA, ATT, TTC, GGG, ATT, GAT, ATG, CCA, TTC, CAG, GAT, GAT, CCA, ACC, GAT, GAA, TGG, GCG, ATC, CGT, GAT, GGT, GAC, TGG, AAG, ATG, ATT, ATC, GAT, CGC, AAT, AAT, AAA, CCG, AAA, TAT, CTC, TAC, AAT, CTG, AAA, TCT, GAT, CGT, TAT, GAA, ACA, CTT, AAT, CTG, ATC, GGT, AAA, AAA, ACA, GAT, ATT, GAA, AAA, CAG, ATG, TAT, GGT, AAG, TTT, TTA, AAA, TAT, AAA, ACT, GAT, ATT, GAT, AAT, GAT, TCT, CTA, ATG, AAA, GCC, AGA, GGT, GAT, AAA, CCA, GAA, GCG, GTG, ACC, TGG, GGC, TAA] +Is Protein?: YES + +Region Name: putative cytoplasmic protein +Nucleotides: ATGTTTACCAACGTAAATGTTGATTGTTGCAAAACACCAGGATGTAAAAACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCACAGGGTAAAAATATTTTATGCCGTGAATGTGGTTACTTGTTTCCAGTGATATCTGAACAGTCGCTTAATATTTATCGTAATATTGTGAATCACTCCTGGAGAGGTTTGATTTGCCAATGTTCAACTTGCGGAGGCACGTCCCTCAAAAAATATGGATATTCTGCACAAGGCCAGAGAAGAATGTATTGCCATCATTGTGAGAAAACATTTATCACTCTGGAACATGTAATTACCACACCACGAGGAGCCCTGTTAGCATTGATGATTGAGCAAGGGGAGGCACTTGCGGATATCAGAAAGTCATTACGTCTTAACAGCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGCAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGTACCCGCGCTTTTCGCGTCAAGTATAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGCGGCAGGGTGGTTGCCATCTCAACCAATTACTCCCCATCTGCCGTAGAGCAACATTATCAATACACATCGAACTATGAAGAGCGTATGTCTCCAGGGACGCTGGCACATCATGTCCAGCGCAAAGAGTTACTTACTATGCGGCGGGATACCTTGTTTGATATTGATTACGGCCCGGCAGTTTTACATCAAAACGATCCGGGAATGTTGGTAAAACCGGTTCTTCCGGCATATCGTCATTTTGAACTGGTCAGAATACTGACCGATGAGCATTCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATATTGGGCGGCTGCCTGATGGCTAATTTGCAGCATATTCATCAAGGTCGCTGCCATATTTCCTTTGTCAAAGAGCGCGGTGTGGCACCCGCCACCATTGATTTTCCACCGCGATTATTCCTTAGTGGTGGGGTACGAAATAATGTCTGGCGTGCATTTTCTAACCGCAATTATTCAATGGCTGTATGCAATCTCACTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATTGAACAGTGCGACGCGTTTTATCCACTTTGTGGAGAACCATCCTTTCCTTATATCATTGAACCGAATGTCTCCTGCGAATGTCGTTTCTACATTAGATATCCTCAAACATCTGTGGAATAAAAAACTAGAGCATGGAACAATTTAA +Nuc. 
Counts: [355, 273, 276, 356] +Total Mass%: [29.36, 18.56, 25.53, 27.26] of 163388.6 +Codons List: [ATG, TTT, ACC, AAC, GTA, AAT, GTT, GAT, TGT, TGC, AAA, ACA, CCA, GGA, TGT, AAA, AAC, CTG, GGG, TTG, CTG, AAT, AGC, CAG, GAT, TAT, GTC, GCA, CAG, GGT, AAA, AAT, ATT, TTA, TGC, CGT, GAA, TGT, GGT, TAC, TTG, TTT, CCA, GTG, ATA, TCT, GAA, CAG, TCG, CTT, AAT, ATT, TAT, CGT, AAT, ATT, GTG, AAT, CAC, TCC, TGG, AGA, GGT, TTG, ATT, TGC, CAA, TGT, TCA, ACT, TGC, GGA, GGC, ACG, TCC, CTC, AAA, AAA, TAT, GGA, TAT, TCT, GCA, CAA, GGC, CAG, AGA, AGA, ATG, TAT, TGC, CAT, CAT, TGT, GAG, AAA, ACA, TTT, ATC, ACT, CTG, GAA, CAT, GTA, ATT, ACC, ACA, CCA, CGA, GGA, GCC, CTG, TTA, GCA, TTG, ATG, ATT, GAG, CAA, GGG, GAG, GCA, CTT, GCG, GAT, ATC, AGA, AAG, TCA, TTA, CGT, CTT, AAC, AGC, ACT, GGA, CTT, AGC, CGT, GAA, CTG, TTA, AAA, TTA, GCG, CGT, GAA, GCA, AAC, TAT, AAA, GAA, AGT, CGA, CAG, TGT, TTC, CCT, GCT, TCT, GAT, ATT, ACC, CTG, AGT, ACC, CGC, GCT, TTT, CGC, GTC, AAG, TAT, AAT, GGT, AGC, AAT, AAC, TCT, CTT, TAT, GCT, CTT, GTT, ACC, GCA, GAA, GAA, CAA, AGC, GGC, AGG, GTG, GTT, GCC, ATC, TCA, ACC, AAT, TAC, TCC, CCA, TCT, GCC, GTA, GAG, CAA, CAT, TAT, CAA, TAC, ACA, TCG, AAC, TAT, GAA, GAG, CGT, ATG, TCT, CCA, GGG, ACG, CTG, GCA, CAT, CAT, GTC, CAG, CGC, AAA, GAG, TTA, CTT, ACT, ATG, CGG, CGG, GAT, ACC, TTG, TTT, GAT, ATT, GAT, TAC, GGC, CCG, GCA, GTT, TTA, CAT, CAA, AAC, GAT, CCG, GGA, ATG, TTG, GTA, AAA, CCG, GTT, CTT, CCG, GCA, TAT, CGT, CAT, TTT, GAA, CTG, GTC, AGA, ATA, CTG, ACC, GAT, GAG, CAT, TCC, AAC, AAC, GTT, CAG, CAT, TAC, CTT, GAT, CAC, GAA, TGC, TTT, ATA, TTG, GGC, GGC, TGC, CTG, ATG, GCT, AAT, TTG, CAG, CAT, ATT, CAT, CAA, GGT, CGC, TGC, CAT, ATT, TCC, TTT, GTC, AAA, GAG, CGC, GGT, GTG, GCA, CCC, GCC, ACC, ATT, GAT, TTT, CCA, CCG, CGA, TTA, TTC, CTT, AGT, GGT, GGG, GTA, CGA, AAT, AAT, GTC, TGG, CGT, GCA, TTT, TCT, AAC, CGC, AAT, TAT, TCA, ATG, GCT, GTA, TGC, AAT, CTC, ACT, GGC, AGT, AAG, AAA, GTC, CGC, GAG, ATG, CGG, CAT, GCA, ACA, TTG, AAC, AGT, GCG, ACG, CGT, TTT, ATC, CAC, 
TTT, GTG, GAG, AAC, CAT, CCT, TTC, CTT, ATA, TCA, TTG, AAC, CGA, ATG, TCT, CCT, GCG, AAT, GTC, GTT, TCT, ACA, TTA, GAT, ATC, CTC, AAA, CAT, CTG, TGG, AAT, AAA, AAA, CTA, GAG, CAT, GGA, ACA, ATT, TAA] +Is Protein?: YES + +Region Name: sodium/proton antiporter 1 +Nucleotides: GTGAAACATCTGCATCGATTCTTTAGCAGTGATGCCTCGGGAGGCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTGCAACCAGTGGATGGTATCACGACTTTCTTGAGACGCCGGTTCAGCTCCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGACGCTCTGATGGCGGTATTTTTCCTGTTGGTTGGTCTGGAAGTTAAACGCGAGCTGATGCAAGGTTCGCTGGCCAGTCTGCGCCAGGCGGCATTTCCTGTTATTGCCGCAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTTTTAACTATGCCGATCCGATTACCCGCGAAGGCTGGGCAATCCCGGCGGCGACTGACATTGCCTTTGCACTTGGTGTGTTGGCGCTGTTGGGAAGTCGTGTTCCGTTAGCGCTGAAGATCTTTTTGATGGCTCTGGCTATTATCGACGATCTTGGGGCCATCATTATCATCGCATTGTTCTACACTAATGACTTATCGATGGCCTCTCTTGGCGTCGCGGCTGTAGCAATTGCGGTACTCGCGGTATTGAATCTGTGTGGTGTACGCCGCACGGGCGTTTATATTCTGGTTGGCGTGGTGCTGTGGACAGCGGTGTTGAAATCGGGGGTTCACGCAACCCTGGCTGGCGTCATTGTCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGGCGCTCTCCGGCTAAACGTCTGGAGCATGTTTTGCATCCATGGGTGGCGTATCTGATTTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAAGGTGTCACGCTGGAAGGTTTGACCTCCATTCTGCCATTAGGGATCATCGCTGGTTTGCTGATTGGCAAGCCACTGGGTATTAGTCTGTTCTGCTGGTTGGCGCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACGACTTACCAGCAAATTATGGCGGTTGGTATCCTGTGCGGTATCGGTTTTACTATGTCTATCTTTATTGCCAGCCTGGCATTTGGTAGCGTAGATCCAGAACTGATTAACTGGGCAAAATTAGGTATCCTTGTCGGTTCAATTTCTTCGGCGGTAATTGGATATAGCTGGTTACGCGTTCGTTTACGTCCATCAGTTTGA +Nuc. 
Counts: [215, 258, 331, 363] +Total Mass%: [19.15, 18.9, 32.98, 29.94] of 151683.9 +Codons List: [GTG, AAA, CAT, CTG, CAT, CGA, TTC, TTT, AGC, AGT, GAT, GCC, TCG, GGA, GGC, ATT, ATT, CTC, ATT, ATT, GCC, GCT, GTA, TTA, GCG, ATG, ATT, ATG, GCC, AAC, AGC, GGT, GCA, ACC, AGT, GGA, TGG, TAT, CAC, GAC, TTT, CTT, GAG, ACG, CCG, GTT, CAG, CTC, CGG, GTT, GGG, ACA, CTT, GAG, ATC, AAC, AAG, AAC, ATG, CTG, CTA, TGG, ATC, AAT, GAC, GCT, CTG, ATG, GCG, GTA, TTT, TTC, CTG, TTG, GTT, GGT, CTG, GAA, GTT, AAA, CGC, GAG, CTG, ATG, CAA, GGT, TCG, CTG, GCC, AGT, CTG, CGC, CAG, GCG, GCA, TTT, CCT, GTT, ATT, GCC, GCA, ATC, GGC, GGG, ATG, ATT, GTC, CCG, GCA, TTG, CTC, TAT, CTG, GCT, TTT, AAC, TAT, GCC, GAT, CCG, ATT, ACC, CGC, GAA, GGC, TGG, GCA, ATC, CCG, GCG, GCG, ACT, GAC, ATT, GCC, TTT, GCA, CTT, GGT, GTG, TTG, GCG, CTG, TTG, GGA, AGT, CGT, GTT, CCG, TTA, GCG, CTG, AAG, ATC, TTT, TTG, ATG, GCT, CTG, GCT, ATT, ATC, GAC, GAT, CTT, GGG, GCC, ATC, ATT, ATC, ATC, GCA, TTG, TTC, TAC, ACT, AAT, GAC, TTA, TCG, ATG, GCC, TCT, CTT, GGC, GTC, GCG, GCT, GTA, GCA, ATT, GCG, GTA, CTC, GCG, GTA, TTG, AAT, CTG, TGT, GGT, GTA, CGC, CGC, ACG, GGC, GTT, TAT, ATT, CTG, GTT, GGC, GTG, GTG, CTG, TGG, ACA, GCG, GTG, TTG, AAA, TCG, GGG, GTT, CAC, GCA, ACC, CTG, GCT, GGC, GTC, ATT, GTC, GGC, TTC, TTT, ATT, CCT, TTG, AAA, GAG, AAG, CAT, GGG, CGC, TCT, CCG, GCT, AAA, CGT, CTG, GAG, CAT, GTT, TTG, CAT, CCA, TGG, GTG, GCG, TAT, CTG, ATT, TTG, CCG, CTG, TTT, GCA, TTT, GCT, AAT, GCT, GGC, GTT, TCA, CTG, CAA, GGT, GTC, ACG, CTG, GAA, GGT, TTG, ACC, TCC, ATT, CTG, CCA, TTA, GGG, ATC, ATC, GCT, GGT, TTG, CTG, ATT, GGC, AAG, CCA, CTG, GGT, ATT, AGT, CTG, TTC, TGC, TGG, TTG, GCG, CTG, CGT, TTG, AAA, TTG, GCA, CAT, CTG, CCA, GAG, GGA, ACG, ACT, TAC, CAG, CAA, ATT, ATG, GCG, GTT, GGT, ATC, CTG, TGC, GGT, ATC, GGT, TTT, ACT, ATG, TCT, ATC, TTT, ATT, GCC, AGC, CTG, GCA, TTT, GGT, AGC, GTA, GAT, CCA, GAA, CTG, ATT, AAC, TGG, GCA, AAA, TTA, GGT, ATC, CTT, GTC, GGT, TCA, ATT, TCT, TCG, GCG, GTA, ATT, GGA, TAT, AGC, TGG, TTA, 
CGC, GTT, CGT, TTA, CGT, CCA, TCA, GTT, TGA] +Is Protein?: NO + +Region Name: transcriptional activator protein NhaR +Nucleotides: ATGAGCATGTCTCATATCAATTACAACCACTTGTATTACTTCTGGCATGTCTACAAAGAAGGTTCTGTGGTTGGCGCAGCGGAGGCGCTTTATTTAACACCACAAACCATTACCGGGCAGATCCGGGCGCTGGAAGAGCGCCTGCAAGGGAAACTATTTAAGCGTAAAGGACGTGGTCTGGAACCCAGCGAACTGGGGGAACTGGTCTATCGCTATGCCGATAAAATGTTCACCTTAAGCCAGGAAATGCTGGATATCGTCAACTATCGCAAAGAGTCCAACTTATTGTTTGATGTTGGTGTGGCAGATGCACTTTCCAAACGTCTGGTCAGCAGTGTTCTGGATGCCGCAGTTGTGGAAGACGAGCAGATCCATCTACGCTGTTTCGAATCGACGCACGAGATGCTTTTAGAGCAGTTGAGTCAGCATAAACTGGATATGATCATCTCTGACTGTCCGATCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAATTGGCGAATGTGGTGTCAGTTTCTGGTGCACTAACCCACTACCAGAAAAGCCGTTTCCTGCCTGTCTTGAAGAGCGTCGTTTACTTATTCCGGGGCGTCGCTCAATGTTGGGGCGTAAACTATTAAACTGGTTTAACTCCCAGGGCTTGAACGTCGAAATTTTGGGTGAGTTTGATGATGCTGCGTTGATGAAAGCCTTTGGGGCGACGCATAACGCTATTTTCGTTGCACCTTCGCTTTACGCTAATGATTTCTATAACGATGACTCGGTTGTGGAGATAGGCCGTGTTGAGAACGTGATGGAAGAGTACCACGCGATTTTTGCCGAAAGGATGATTCAGCACCCTGCAGTACAGCGTATCTGCAATACAGACTATTCTGCGCTGTTTACTCCAGCTTCAAAATAA +Nuc. 
Counts: [228, 197, 232, 249] +Total Mass%: [26.07, 18.52, 29.67, 26.36] of 118181.6 +Codons List: [ATG, AGC, ATG, TCT, CAT, ATC, AAT, TAC, AAC, CAC, TTG, TAT, TAC, TTC, TGG, CAT, GTC, TAC, AAA, GAA, GGT, TCT, GTG, GTT, GGC, GCA, GCG, GAG, GCG, CTT, TAT, TTA, ACA, CCA, CAA, ACC, ATT, ACC, GGG, CAG, ATC, CGG, GCG, CTG, GAA, GAG, CGC, CTG, CAA, GGG, AAA, CTA, TTT, AAG, CGT, AAA, GGA, CGT, GGT, CTG, GAA, CCC, AGC, GAA, CTG, GGG, GAA, CTG, GTC, TAT, CGC, TAT, GCC, GAT, AAA, ATG, TTC, ACC, TTA, AGC, CAG, GAA, ATG, CTG, GAT, ATC, GTC, AAC, TAT, CGC, AAA, GAG, TCC, AAC, TTA, TTG, TTT, GAT, GTT, GGT, GTG, GCA, GAT, GCA, CTT, TCC, AAA, CGT, CTG, GTC, AGC, AGT, GTT, CTG, GAT, GCC, GCA, GTT, GTG, GAA, GAC, GAG, CAG, ATC, CAT, CTA, CGC, TGT, TTC, GAA, TCG, ACG, CAC, GAG, ATG, CTT, TTA, GAG, CAG, TTG, AGT, CAG, CAT, AAA, CTG, GAT, ATG, ATC, ATC, TCT, GAC, TGT, CCG, ATC, GAT, TCC, ACT, CAG, CAG, GAA, GGG, CTG, TTT, TCC, ATG, AAA, ATT, GGC, GAA, TGT, GGT, GTC, AGT, TTC, TGG, TGC, ACT, AAC, CCA, CTA, CCA, GAA, AAG, CCG, TTT, CCT, GCC, TGT, CTT, GAA, GAG, CGT, CGT, TTA, CTT, ATT, CCG, GGG, CGT, CGC, TCA, ATG, TTG, GGG, CGT, AAA, CTA, TTA, AAC, TGG, TTT, AAC, TCC, CAG, GGC, TTG, AAC, GTC, GAA, ATT, TTG, GGT, GAG, TTT, GAT, GAT, GCT, GCG, TTG, ATG, AAA, GCC, TTT, GGG, GCG, ACG, CAT, AAC, GCT, ATT, TTC, GTT, GCA, CCT, TCG, CTT, TAC, GCT, AAT, GAT, TTC, TAT, AAC, GAT, GAC, TCG, GTT, GTG, GAG, ATA, GGC, CGT, GTT, GAG, AAC, GTG, ATG, GAA, GAG, TAC, CAC, GCG, ATT, TTT, GCC, GAA, AGG, ATG, ATT, CAG, CAC, CCT, GCA, GTA, CAG, CGT, ATC, TGC, AAT, ACA, GAC, TAT, TCT, GCG, CTG, TTT, ACT, CCA, GCT, TCA, AAA, TAA] +Is Protein?: YES + +Region Name: riboflavin kinase +Nucleotides: 
ATGAAGCTGATACGCGGCATACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTAATTTCGACGGCGTGCATCGCGGTCATCGCGCGCTGTTACAGGGCTTGCAGGAAGAAGGGCGCAAGCGCAACTTACCGGTGATGGTGATGCTTTTTGAACCTCAACCACTGGAACTGTTTGCTACTGATAAAGCCCCGGCACGGCTCACCCGGCTGCGGGAAAAACTGCGTTATCTTGCAGAGTGTGGCGTTGATTACGTGCTGTGCGTGCGTTTTGACAGGCGTTTTGCGGCGTTAACCGCGCAAAACTTCATCAGTGATCTTCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGATTTCCGCTTTGGCGCTGGTCGTGAAGGCGATTTCTTGTTATTACAGAAAGCGGGCATGGAATACGGCTTCGATATCACCAGCACGCAAACTTTTTGCGAAGGTGGTGTGCGTATCAGCAGCACCGCCGTGCGTCAGGCGCTTGCGGATGACAATCTGGCTCTGGCAGAAAGTTTACTGGGGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGAATTAGGGCGCACTATAGGTTTCCCGACGGCGAATGTACCGCTACGCCGTCAGGTTTCCCCGGTGAAAGGGGTTTATGCGGTAGAAGTGTTGGGCCTTGGCGAAAAGCCGTTACCCGGCGTTGCAAACATCGGAACACGCCCAACGGTTGCCGGTATTCGCCAGCAACTGGAAGTGCATTTGTTAGATGTTGCAATGGACCTTTATGGTCGCCATATACAAGTAGTGCTGCGTAAAAAAATACGCAATGAGCAGCGATTTGCATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGCCCGCGAATTTTTTGGGCTAACAAAACCGGCTTAA +Nuc. Counts: [213, 221, 276, 232] +Total Mass%: [23.23, 19.81, 33.66, 23.42] of 123918.1 +Codons List: [ATG, AAG, CTG, ATA, CGC, GGC, ATA, CAT, AAT, CTC, AGC, CAG, GCC, CCG, CAA, GAA, GGG, TGT, GTG, CTG, ACT, ATT, GGT, AAT, TTC, GAC, GGC, GTG, CAT, CGC, GGT, CAT, CGC, GCG, CTG, TTA, CAG, GGC, TTG, CAG, GAA, GAA, GGG, CGC, AAG, CGC, AAC, TTA, CCG, GTG, ATG, GTG, ATG, CTT, TTT, GAA, CCT, CAA, CCA, CTG, GAA, CTG, TTT, GCT, ACT, GAT, AAA, GCC, CCG, GCA, CGG, CTC, ACC, CGG, CTG, CGG, GAA, AAA, CTG, CGT, TAT, CTT, GCA, GAG, TGT, GGC, GTT, GAT, TAC, GTG, CTG, TGC, GTG, CGT, TTT, GAC, AGG, CGT, TTT, GCG, GCG, TTA, ACC, GCG, CAA, AAC, TTC, ATC, AGT, GAT, CTT, CTG, GTG, AAG, CAC, TTG, CGG, GTA, AAA, TTT, CTT, GCC, GTA, GGT, GAC, GAT, TTC, CGC, TTT, GGC, GCT, GGT, CGT, GAA, GGC, GAT, TTC, TTG, TTA, TTA, CAG, AAA, GCG, GGC, ATG, GAA, TAC, GGC, TTC, GAT, ATC, ACC, AGC, ACG, CAA, ACT, TTT, TGC, GAA, GGT, GGT, GTG, CGT, ATC, AGC, AGC, ACC, GCC, GTG, CGT, CAG, GCG, CTT, GCG, GAT, GAC, AAT, CTG, GCT, CTG, GCA, GAA, AGT, TTA, CTG, GGG, CAC, CCG, TTT, GCT, 
ATC, TCC, GGG, CGT, GTA, GTC, CAC, GGT, GAT, GAA, TTA, GGG, CGC, ACT, ATA, GGT, TTC, CCG, ACG, GCG, AAT, GTA, CCG, CTA, CGC, CGT, CAG, GTT, TCC, CCG, GTG, AAA, GGG, GTT, TAT, GCG, GTA, GAA, GTG, TTG, GGC, CTT, GGC, GAA, AAG, CCG, TTA, CCC, GGC, GTT, GCA, AAC, ATC, GGA, ACA, CGC, CCA, ACG, GTT, GCC, GGT, ATT, CGC, CAG, CAA, CTG, GAA, GTG, CAT, TTG, TTA, GAT, GTT, GCA, ATG, GAC, CTT, TAT, GGT, CGC, CAT, ATA, CAA, GTA, GTG, CTG, CGT, AAA, AAA, ATA, CGC, AAT, GAG, CAG, CGA, TTT, GCA, TCG, CTG, GAC, GAA, CTG, AAA, GCG, CAG, ATT, GCG, CGT, GAT, GAA, TTA, ACC, GCC, CGC, GAA, TTT, TTT, GGG, CTA, ACA, AAA, CCG, GCT, TAA] +Is Protein?: YES + +Region Name: Isoleucyl-tRNA synthetase +Nucleotides: ATGAGTGACTATAAATCAACCCTGAATTTGCCGGAAACAGGGTTCCCGATGCGTGGCGATCTCGCCAAGCGCGAACCGGGAATGCTGGCGCGTTGGACTGATGATGATCTGTACGGCATCATCCGTGCGGCTAAAAAAGGCAAAAAAACCTTCATTCTGCATGATGGCCCTCCTTATGCGAATGGCAGCATTCATATTGGTCACTCGGTTAACAAGATTCTGAAAGACATTATCATTAAGTCCAAAGGGCTTTCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCATGGTCTGCCAATCGAACTGAAAGTAGAGCAAGAATACGGTAAGCCGGGGGAGAAATTCACCGCCGCTGAGTTCCGCGCCAAGTGCCGCGAATACGCTGCGACCCAGGTTGACGGTCAGCGCAAAGACTTTATCCGTCTGGGCGTGCTGGGCGACTGGTCGCACCCGTACCTGACCATGGACTTCAAAACTGAAGCCAACATCATCCGCGCGCTGGGCAAAATCATCGGCAACGGTCACCTGCACAAAGGCGCGAAGCCGGTGCACTGGTGCGTTGACTGCCGTTCTGCACTGGCAGAAGCGGAAGTTGAGTATTACGACAAAACTTCTCCGTCCATCGACGTCGCTTTCCAGGCGGTCGATCAGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATGTTAACGGCCCAATTTCGCTGGTTATCTGGACCACCACGCCGTGGACGCTGCCTGCTAACCGCGCAATCTCCATTGCACCTGATTTTGATTATGCGCTGGTGCAAATCGACGGTCAGGCCGTGATCCTCGCGAAAGATCTGGTTGAAAGCGTAATGCAGCGTATCGGCGTTAGCGATTACACCATTCTTGGCACGGTGAAAGGTGCCGAGCTGGAACTGTTGCGCTTTACCCATCCGTTTATGGACTTCGATGTTCCGGCAATTCTCGGCGACCACGTTACGCTGGATGCCGGTACCGGTGCCGTTCATACCGCGCCAGGCCACGGTCCGGACGACTATGTGATCGGTCAAAAATATGGTCTGGAAACCGCTAACCCGGTTGGCCCGGACGGCACTTATCTGCCGGGTACTTACCCGACTCTGGATGGCGTTAACGTCTTCAAAGCGAACGATATTGTCATTGCGTTGTTGCAGGAAAAAGGCGCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTGCTGCTGGCGTCATAAAACGCCGATCATCTTCCGCGCGACGCCGCAGTGGTTCGTCAGCATGGATCAGAAAGGTCTGCGTGCGCAGTCACTGA
AAGAGATCAAAGGCGTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATCTCTCGTCAGCGTACCTGGGGCGTGCCGATGTCACTGTTCGTGCACAAAGACACAGAAGAACTGCATCCGCGTACTCTCGAACTGATGGAAGAAGTGGCAAAACGCGTTGAAGTTGACGGCATTCAGGCGTGGTGGGATCTCGATGCGAAAGAGATCCTCGGCGACGAAGCTGACCAGTATGTGAAAGTACCGGATACGCTGGATGTATGGTTTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTCCGGAATTTGCCGGTCACGCAGCGGACATGTATCTGGAAGGTTCTGACCAACACCGTGGCTGGTTCATGTCTTCCCTGATGATCTCTACCGCGATGAAGGGCAAAGCGCCATATCGTCAGGTACTGACTCACGGCTTTACCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGTAACACCGTTTCGCCGCAGGATGTGATGAATAAACTGGGTGCGGATATTCTGCGTCTGTGGGTGGCATCAACCGACTACACTGGCGAAATGGCCGTTTCTGACGAGATCCTGAAACGTGCTGCCGACAGCTATCGTCGTATCCGTAACACCGCGCGCTTCCTGCTGGCAAACCTGAACGGTTTTGATCCGGCAAAAGATATGGTGAAACCGGAAGAGATGGTGGTACTGGATCGCTGGGCCGTAGGTTGTGCGAAAGCGGCACAGGAAGACATCCTCAAGGCGTACGAAGCATACGATTTCCACGAAGTGGTACAGCGTCTGATGCGCTTCTGCTCCGTTGAGATGGGTTCCTTCTACCTCGACATCATCAAAGACCGTCAGTATACCGCCAAAGCGGACAGCGTGGCGCGTCGTAGCTGCCAGACTGCGCTGTATCACATCGCAGAAGCGCTGGTTCGCTGGATGGCACCAATCCTCTCCTTCACCGCTGATGAAGTGTGGGGTTACCTGCCGGGCGAACGTGAAAAATACGTCTTCACCGGCGAGTGGTACGAAGGCCTGTTTGGTCTGGCAGACAGTGAAGCAATGAACGATGCGTTCTGGGACGAGCTGTTGAAAGTGCGTGGCGAAGTGAACAAAGTCATTGAGCAAGCGCGTGCCGATAAGAACGTGGGCGGCTCGCTGGAAGCGGCAGTAACCTTGTATGCAGAACCGGAACTGGCGGCGAAACTGACCGCGCTGGGCGATGAATTACGATTTGTCCTGTTGACCTCCGGCGCTACCGTTGCAGACTATAACGACGCACCTGCTGATGCCCAGCAGAGCGAAGTCCTCAAAGGGCTGAAAGTCGCGTTGAGTAAAGCCGAAGGTGAGAAGTGTCCTCGCTGCTGGCACTACACCCAGGATGTCGGCAAGGTGGCGGAACACGCAGAAATCTGCGGCCGCTGTGTCAGCAACGTCGCCGGTGACGGTGAAAAACGTAAGTTTGCCTGA +Nuc. 
Counts: [660, 720, 817, 620] +Total Mass%: [24.0, 21.53, 33.23, 20.87] of 371617.0 +Codons List: [ATG, AGT, GAC, TAT, AAA, TCA, ACC, CTG, AAT, TTG, CCG, GAA, ACA, GGG, TTC, CCG, ATG, CGT, GGC, GAT, CTC, GCC, AAG, CGC, GAA, CCG, GGA, ATG, CTG, GCG, CGT, TGG, ACT, GAT, GAT, GAT, CTG, TAC, GGC, ATC, ATC, CGT, GCG, GCT, AAA, AAA, GGC, AAA, AAA, ACC, TTC, ATT, CTG, CAT, GAT, GGC, CCT, CCT, TAT, GCG, AAT, GGC, AGC, ATT, CAT, ATT, GGT, CAC, TCG, GTT, AAC, AAG, ATT, CTG, AAA, GAC, ATT, ATC, ATT, AAG, TCC, AAA, GGG, CTT, TCT, GGA, TAT, GAC, TCG, CCG, TAT, GTG, CCT, GGC, TGG, GAC, TGT, CAT, GGT, CTG, CCA, ATC, GAA, CTG, AAA, GTA, GAG, CAA, GAA, TAC, GGT, AAG, CCG, GGG, GAG, AAA, TTC, ACC, GCC, GCT, GAG, TTC, CGC, GCC, AAG, TGC, CGC, GAA, TAC, GCT, GCG, ACC, CAG, GTT, GAC, GGT, CAG, CGC, AAA, GAC, TTT, ATC, CGT, CTG, GGC, GTG, CTG, GGC, GAC, TGG, TCG, CAC, CCG, TAC, CTG, ACC, ATG, GAC, TTC, AAA, ACT, GAA, GCC, AAC, ATC, ATC, CGC, GCG, CTG, GGC, AAA, ATC, ATC, GGC, AAC, GGT, CAC, CTG, CAC, AAA, GGC, GCG, AAG, CCG, GTG, CAC, TGG, TGC, GTT, GAC, TGC, CGT, TCT, GCA, CTG, GCA, GAA, GCG, GAA, GTT, GAG, TAT, TAC, GAC, AAA, ACT, TCT, CCG, TCC, ATC, GAC, GTC, GCT, TTC, CAG, GCG, GTC, GAT, CAG, GAT, GCG, CTG, AAA, ACG, AAA, TTT, GGC, GTA, AGC, AAT, GTT, AAC, GGC, CCA, ATT, TCG, CTG, GTT, ATC, TGG, ACC, ACC, ACG, CCG, TGG, ACG, CTG, CCT, GCT, AAC, CGC, GCA, ATC, TCC, ATT, GCA, CCT, GAT, TTT, GAT, TAT, GCG, CTG, GTG, CAA, ATC, GAC, GGT, CAG, GCC, GTG, ATC, CTC, GCG, AAA, GAT, CTG, GTT, GAA, AGC, GTA, ATG, CAG, CGT, ATC, GGC, GTT, AGC, GAT, TAC, ACC, ATT, CTT, GGC, ACG, GTG, AAA, GGT, GCC, GAG, CTG, GAA, CTG, TTG, CGC, TTT, ACC, CAT, CCG, TTT, ATG, GAC, TTC, GAT, GTT, CCG, GCA, ATT, CTC, GGC, GAC, CAC, GTT, ACG, CTG, GAT, GCC, GGT, ACC, GGT, GCC, GTT, CAT, ACC, GCG, CCA, GGC, CAC, GGT, CCG, GAC, GAC, TAT, GTG, ATC, GGT, CAA, AAA, TAT, GGT, CTG, GAA, ACC, GCT, AAC, CCG, GTT, GGC, CCG, GAC, GGC, ACT, TAT, CTG, CCG, GGT, ACT, TAC, CCG, ACT, CTG, GAT, GGC, GTT, AAC, GTC, TTC, AAA, GCG, AAC, 
GAT, ATT, GTC, ATT, GCG, TTG, TTG, CAG, GAA, AAA, GGC, GCA, CTG, TTG, CAC, GTT, GAG, AAA, ATG, CAA, CAC, AGC, TAT, CCG, TGC, TGC, TGG, CGT, CAT, AAA, ACG, CCG, ATC, ATC, TTC, CGC, GCG, ACG, CCG, CAG, TGG, TTC, GTC, AGC, ATG, GAT, CAG, AAA, GGT, CTG, CGT, GCG, CAG, TCA, CTG, AAA, GAG, ATC, AAA, GGC, GTG, CAG, TGG, ATC, CCT, GAC, TGG, GGC, CAG, GCG, CGT, ATC, GAG, TCG, ATG, GTT, GCT, AAC, CGT, CCT, GAC, TGG, TGT, ATC, TCT, CGT, CAG, CGT, ACC, TGG, GGC, GTG, CCG, ATG, TCA, CTG, TTC, GTG, CAC, AAA, GAC, ACA, GAA, GAA, CTG, CAT, CCG, CGT, ACT, CTC, GAA, CTG, ATG, GAA, GAA, GTG, GCA, AAA, CGC, GTT, GAA, GTT, GAC, GGC, ATT, CAG, GCG, TGG, TGG, GAT, CTC, GAT, GCG, AAA, GAG, ATC, CTC, GGC, GAC, GAA, GCT, GAC, CAG, TAT, GTG, AAA, GTA, CCG, GAT, ACG, CTG, GAT, GTA, TGG, TTT, GAC, TCC, GGA, TCT, ACC, CAC, TCT, TCC, GTT, GTT, GAT, GTG, CGT, CCG, GAA, TTT, GCC, GGT, CAC, GCA, GCG, GAC, ATG, TAT, CTG, GAA, GGT, TCT, GAC, CAA, CAC, CGT, GGC, TGG, TTC, ATG, TCT, TCC, CTG, ATG, ATC, TCT, ACC, GCG, ATG, AAG, GGC, AAA, GCG, CCA, TAT, CGT, CAG, GTA, CTG, ACT, CAC, GGC, TTT, ACC, GTG, GAT, GGT, CAG, GGT, CGC, AAG, ATG, TCT, AAA, TCC, ATC, GGT, AAC, ACC, GTT, TCG, CCG, CAG, GAT, GTG, ATG, AAT, AAA, CTG, GGT, GCG, GAT, ATT, CTG, CGT, CTG, TGG, GTG, GCA, TCA, ACC, GAC, TAC, ACT, GGC, GAA, ATG, GCC, GTT, TCT, GAC, GAG, ATC, CTG, AAA, CGT, GCT, GCC, GAC, AGC, TAT, CGT, CGT, ATC, CGT, AAC, ACC, GCG, CGC, TTC, CTG, CTG, GCA, AAC, CTG, AAC, GGT, TTT, GAT, CCG, GCA, AAA, GAT, ATG, GTG, AAA, CCG, GAA, GAG, ATG, GTG, GTA, CTG, GAT, CGC, TGG, GCC, GTA, GGT, TGT, GCG, AAA, GCG, GCA, CAG, GAA, GAC, ATC, CTC, AAG, GCG, TAC, GAA, GCA, TAC, GAT, TTC, CAC, GAA, GTG, GTA, CAG, CGT, CTG, ATG, CGC, TTC, TGC, TCC, GTT, GAG, ATG, GGT, TCC, TTC, TAC, CTC, GAC, ATC, ATC, AAA, GAC, CGT, CAG, TAT, ACC, GCC, AAA, GCG, GAC, AGC, GTG, GCG, CGT, CGT, AGC, TGC, CAG, ACT, GCG, CTG, TAT, CAC, ATC, GCA, GAA, GCG, CTG, GTT, CGC, TGG, ATG, GCA, CCA, ATC, CTC, TCC, TTC, ACC, GCT, GAT, GAA, GTG, TGG, GGT, TAC, CTG, CCG, GGC, 
GAA, CGT, GAA, AAA, TAC, GTC, TTC, ACC, GGC, GAG, TGG, TAC, GAA, GGC, CTG, TTT, GGT, CTG, GCA, GAC, AGT, GAA, GCA, ATG, AAC, GAT, GCG, TTC, TGG, GAC, GAG, CTG, TTG, AAA, GTG, CGT, GGC, GAA, GTG, AAC, AAA, GTC, ATT, GAG, CAA, GCG, CGT, GCC, GAT, AAG, AAC, GTG, GGC, GGC, TCG, CTG, GAA, GCG, GCA, GTA, ACC, TTG, TAT, GCA, GAA, CCG, GAA, CTG, GCG, GCG, AAA, CTG, ACC, GCG, CTG, GGC, GAT, GAA, TTA, CGA, TTT, GTC, CTG, TTG, ACC, TCC, GGC, GCT, ACC, GTT, GCA, GAC, TAT, AAC, GAC, GCA, CCT, GCT, GAT, GCC, CAG, CAG, AGC, GAA, GTC, CTC, AAA, GGG, CTG, AAA, GTC, GCG, TTG, AGT, AAA, GCC, GAA, GGT, GAG, AAG, TGT, CCT, CGC, TGC, TGG, CAC, TAC, ACC, CAG, GAT, GTC, GGC, AAG, GTG, GCG, GAA, CAC, GCA, GAA, ATC, TGC, GGC, CGC, TGT, GTC, AGC, AAC, GTC, GCC, GGT, GAC, GGT, GAA, AAA, CGT, AAG, TTT, GCC, TGA] +Is Protein?: YES + +Region Name: Non-protein region +Nucleotides: GCTTGCGCCAACGCCATTTCATCGCCATCCCGCCGAGCATACAGGCCTCGGAAGAACCAATGGTGTTGGTGCCAACGGCCTGACCATTTTTCGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGCAGATTGCGGATATTCTTCTTTGTCGATCCAGTTTTTGTTAATGGATAAATCCA +Nuc. 
Counts: [46, 56, 49, 53] +Total Mass%: [23.44, 23.46, 27.93, 25.01] of 26515.7 +Codons List: [GCT, TGC, GCC, AAC, GCC, ATT, TCA, TCG, CCA, TCC, CGC, CGA, GCA, TAC, AGG, CCT, CGG, AAG, AAC, CAA, TGG, TGT, TGG, TGC, CAA, CGG, CCT, GAC, CAT, TTT, TCG, GTG, CAG, GCG, CAT, GCC, ACA, GAT, CGG, CAA, CCA, TGT, TTA, CGC, AAC, GCA, GAT, CGA, TTG, CTG, CAG, ATT, GCG, GAT, ATT, CTT, CTT, TGT, CGA, TCC, AGT, TTT, TGT, TAA, TGG, ATA, AAT, CCA] +Is Protein?: NO + +Region Name: FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase +Nucleotides: ATGTCTGAATCTGTACAGAGCAATAGCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGATGGCACCACCGCTGAGTCTACCCGCAACAACGGTAAACCGGCGCTGTTCCGCCTGGGTGATGCTTCTCTTTCTGAAGGGCTGGAGCAACACCTGCTGGGGCTGAAAGTGGGCGATAAAACCACCTTCTCGCTGGAGCCAGATGCGGCGTTTGGCGTGCCGTCACCGGACCTGATTCAGTACTTCTCCCGCCGTGAATTTATGGATGCAGGCGAGCCAGAAATTGGCGCAATCATGCTTTTTACCGCAATGGATGGCAGTGAGATGCCTGGCGTGATCCGCGAAATTAACGGCGACTCCATTACCGTTGATTTCAACCATCCGCTGGCCGGGCAGACCGTTCATTTTGATATTGAAGTGCTGGAAATCGATCCGGCACTGGAGGCGTAA +Nuc. Counts: [100, 121, 125, 104] +Total Mass%: [22.87, 22.75, 31.97, 22.02] of 59096.4 +Codons List: [ATG, TCT, GAA, TCT, GTA, CAG, AGC, AAT, AGC, GCC, GTC, CTG, GTG, CAC, TTC, ACG, CTA, AAA, CTC, GAC, GAT, GGC, ACC, ACC, GCT, GAG, TCT, ACC, CGC, AAC, AAC, GGT, AAA, CCG, GCG, CTG, TTC, CGC, CTG, GGT, GAT, GCT, TCT, CTT, TCT, GAA, GGG, CTG, GAG, CAA, CAC, CTG, CTG, GGG, CTG, AAA, GTG, GGC, GAT, AAA, ACC, ACC, TTC, TCG, CTG, GAG, CCA, GAT, GCG, GCG, TTT, GGC, GTG, CCG, TCA, CCG, GAC, CTG, ATT, CAG, TAC, TTC, TCC, CGC, CGT, GAA, TTT, ATG, GAT, GCA, GGC, GAG, CCA, GAA, ATT, GGC, GCA, ATC, ATG, CTT, TTT, ACC, GCA, ATG, GAT, GGC, AGT, GAG, ATG, CCT, GGC, GTG, ATC, CGC, GAA, ATT, AAC, GGC, GAC, TCC, ATT, ACC, GTT, GAT, TTC, AAC, CAT, CCG, CTG, GCC, GGG, CAG, ACC, GTT, CAT, TTT, GAT, ATT, GAA, GTG, CTG, GAA, ATC, GAT, CCG, GCA, CTG, GAG, GCG, TAA] +Is Protein?: YES + diff --git a/dna/spec/dna.txt b/dna/spec/dna.txt new file mode 100644 index 0000000..0c98d4d --- /dev/null +++ b/dna/spec/dna.txt @@ -0,0 
+1,18 @@ +cure for cancer protein +ATGCCACTATGGTAG +captain picard hair growth protein +ATgCCAACATGgATGCCcGATAtGGATTgA +bogus protein +CCATtAATgATCaCAGTt +michael jordan mad hops protein +ATgAGATCCgtgatGTGggaTCCTaCTCATTaa +paris hilton phony protein +AtgCCaacaTGGATGCCCTAAGATAtgGATTagtgA +george w bush approval rating protein +atgataattagttttaatatcagactgtaa +jimi hendrix guitar talent protein +ATGCAATTGCTCGATTAG +tyler durden's brain protein +ATGATAcctatgagtaaTGTGGACCatatccaaACTATAGGCATtgtcggACCAACGATcgattggtTATACTGA +mini me growth hormone +AtGgGaCGCTgA \ No newline at end of file diff --git a/dna/spec/dna_console.txt b/dna/spec/dna_console.txt new file mode 100644 index 0000000..58d0fef --- /dev/null +++ b/dna/spec/dna_console.txt @@ -0,0 +1,5 @@ +This program reports information about DNA +nucleotide sequences that may encode proteins. + +Input file name? dna.txt +Output file name? dna_file.txt diff --git a/dna/spec/dna_file.txt b/dna/spec/dna_file.txt new file mode 100644 index 0000000..16c267e --- /dev/null +++ b/dna/spec/dna_file.txt @@ -0,0 +1,63 @@ +Region Name: cure for cancer protein +Nucleotides: ATGCCACTATGGTAG +Nuc. Counts: [4, 3, 4, 4] +Total Mass%: [27.3, 16.8, 30.6, 25.3] of 1978.8 +Codons List: [ATG, CCA, CTA, TGG, TAG] +Is Protein?: YES + +Region Name: captain picard hair growth protein +Nucleotides: ATGCCAACATGGATGCCCGATATGGATTGA +Nuc. Counts: [9, 6, 8, 7] +Total Mass%: [30.7, 16.8, 30.5, 22.1] of 3967.5 +Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, GAT, ATG, GAT, TGA] +Is Protein?: YES + +Region Name: bogus protein +Nucleotides: CCATTAATGATCACAGTT +Nuc. Counts: [6, 4, 2, 6] +Total Mass%: [35.1, 19.3, 13.1, 32.5] of 2308.1 +Codons List: [CCA, TTA, ATG, ATC, ACA, GTT] +Is Protein?: NO + +Region Name: michael jordan mad hops protein +Nucleotides: ATGAGATCCGTGATGTGGGATCCTACTCATTAA +Nuc. 
Counts: [9, 6, 8, 10] +Total Mass%: [28.0, 15.3, 27.8, 28.8] of 4342.9 +Codons List: [ATG, AGA, TCC, GTG, ATG, TGG, GAT, CCT, ACT, CAT, TAA] +Is Protein?: YES + +Region Name: paris hilton phony protein +Nucleotides: ATGCCAACATGGATGCCCTAAGATATGGATTAGTGA +Nuc. Counts: [12, 6, 9, 9] +Total Mass%: [34.0, 14.0, 28.5, 23.6] of 4774.3 +Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, TAA, GAT, ATG, GAT, TAG, TGA] +Is Protein?: YES + +Region Name: george w bush approval rating protein +Nucleotides: ATGATAATTAGTTTTAATATCAGACTGTAA +Nuc. Counts: [12, 2, 4, 12] +Total Mass%: [41.1, 5.6, 15.3, 38.0] of 3949.5 +Codons List: [ATG, ATA, ATT, AGT, TTT, AAT, ATC, AGA, CTG, TAA] +Is Protein?: NO + +Region Name: jimi hendrix guitar talent protein +Nucleotides: ATGCAATTGCTCGATTAG +Nuc. Counts: [5, 3, 4, 6] +Total Mass%: [28.6, 14.1, 25.6, 31.8] of 2364.1 +Codons List: [ATG, CAA, TTG, CTC, GAT, TAG] +Is Protein?: YES + +Region Name: tyler durden's brain protein +Nucleotides: ATGATACCTATGAGTAATGTGGACCATATCCAAACTATAGGCATTGTCGGACCAACGATCGATTGGTTATACTGA +Nuc. Counts: [24, 14, 16, 21] +Total Mass%: [32.9, 15.8, 24.6, 26.7] of 9843.8 +Codons List: [ATG, ATA, CCT, ATG, AGT, AAT, GTG, GAC, CAT, ATC, CAA, ACT, ATA, GGC, ATT, GTC, GGA, CCA, ACG, ATC, GAT, TGG, TTA, TAC, TGA] +Is Protein?: YES + +Region Name: mini me growth hormone +Nucleotides: ATGGGACGCTGA +Nuc. 
Counts: [3, 2, 5, 2] +Total Mass%: [24.8, 13.6, 46.3, 15.3] of 1633.4 +Codons List: [ATG, GGA, CGC, TGA] +Is Protein?: NO + diff --git a/dna/spec/ecoli.txt b/dna/spec/ecoli.txt new file mode 100644 index 0000000..e9c20cc --- /dev/null +++ b/dna/spec/ecoli.txt @@ -0,0 +1,40 @@ +thr operon leader peptide +ATGAAACGCATTAGCaCCAcCATtACCACCaCCATCaCcATTACCACAGGTAACGGTGCGGGCTGA +aspartokinase I/homoserine dehydrogenase I +ATGCGAGtGTTGAAGTTcgGCGGTaCATCAgTGGCAAATGCAGAACGTtTTCTGCGGgTTGCCGATAttCTGGAAAGcAATGCCAGGCAGGGGCAGgTGGcCACCGTCCTCtCTGcCCCCGCCAAAATCACCAACCATCtGGTaGCGATGATtGaaAAaACCATtAGCGGTCAGGAtGCtTTaCcCaATATCAGCGATGCCGAACGTATTTTTGCCGAACTtCTGACgGGACTCGCCGCcGCCCAGcCGGGATTTCCGCTGGCACAAtTgAAAAcTTTCGTCGACCAgGAATTTGCCCAAATAAAACATGTcCtGCATGGCatCAGTTTGTTGGGGCAGTGCCCGGaTAGCATcAACGCTGCGCTGATTTGcCGTGgCGAGAAAaTGTcGaTcgCCattaTGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGgTCGAAaAAcTGCTgGCAGTGGGTCATTAcCtCgAaTCTACCGTTGATaTtGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCgGCTGACCACATgGtGCTGATGGCTGGTTTCACTGcCggTAATGAAAAAGgCGaGCTGGtGGTtCTGGGAcGCAACGGTTCCGACTaCTCCGCTGCGGTgCTGGCGGCcTGTTTaCGCGCCGATTGTTGcGAgaTCTGGACGGATGTTGAcGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGgAaGCGATGGAGCTTTCTTACTTCGGCGCTAAAgTTCTTCaCCCcCGCACCATTACCCCCATcGCCCAGtTCCAGATcCCTtgCCtGATTAAAAATAcCGgAAAtCCCCAAGCACCAGgTACGCtCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATcTGAATaACATGGCAATgTTCAGcGTTTCCGgCCCGGGGAtGAAAGGgATggTTgGCATGGCGGCGCGcgTCTTTGCAGcGaTGTCACGCGCCCGTaTTtCCGTGGTgCtGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCaAAGCGACTGTGTGCGAGCTgAaCGGGCAaTGcAGGAAGAGtTCTACCTGGAaCTGaAAGAAGGCTTACTGGAGCcGTTGGCgGtGACGGAACGGCTGGCCATTATCTcGGTGgTAGGTGATGGTATGCGcACCTtaCGTGGGAtCTCGgCGAAATtCTtTGCCGCGCTgGCcCGCGCCAATATCAACATTGTCgCCATTGCtCaGGGaTCTTcTGAaCGCTCAAtCTCTGTcGTGGTcAaTAACGATgATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGgCGTCGGTGGCGTTGgcGGTGCGCTGCTGgAGCAACTGAAGCGTCAgCAAAGCTGGTTGAAGAATAAaCATATCGaCTTACGTGTCTGCGGTGTTGCTAACTCGAAGgCACtgCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGgAAGAACTGGCGCAAGC
cAAAGAGCCGTTTAATCTCGgGCGcTtAATTCGCCTCGTGAAAGAATATCATCTGCtGAaCCCGGTCATTgTTGACTgTACTTCCAgCCAGGCTGTgGCAGaTCAATATgCCGACTtCCTgCGCGAAGGTTTCCAcGTTGTtACGCCGAaCAAAaAGGCCaACACCTCGTcgATGGaTTACTaCCATCAGTtGCGTTATGCGGCGGAAAAATCGCGGCGTAaATTCCTCtATGACACcaACGTtGGGGCTGGATTACCGGTTATTgAGAACCTGCAAAATCTGCTCAATGCtGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTAtATCTTCGGCAAGTTAGACGAAGGCaTGAGTtTCTCCGAGgCGACCaCACTGGCGCGGGAAATGgGTTATACCGAACCGGAcCcGCGAGATGATCTTtCtGGTATGgAtGTGGCGCgTAagCTAtTGATtCTCGCTCGTGAAACGGGACGTGAACTGGAGCtGGCGGATATTGAAATTGAACCTgTGCTGCCCGCaGaGTTTAACGCCGAGGGTGATGTCGCcGCTTTTATGGCGAATCTGTCACAGCTCGACGaTCtCTTTGCCGCGCGTGTgGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATAttGATGAAGATgGCgTCTGCCGCGTGAAGaTTGCCGAAGTGGATGgTAATGaTCCGCTGTTCAAAGTGAaAaATGGCGaAAACGCCCTGGCCTTCTATAGCCACTATtATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCaATgACGTTaCAGCTGCCGGTgTCTTTGCTGATCTGCTACGtACCCTcTCAtGGaAGTTAGGAGTCTGA +homoserine kinase +ATgGTTAAAgTTTAtGCCCCGGCtTCCAGTGCCaATATGaGcGTCGgGTTTGATGTGCTCGGGgCGGCGGTGACACCTGTTGATGGTGCATTGCTCGgAGaTGTagTcaCGGTTGAGGCGGCAGAGACaTTCAgTCTCAACAACCTCGGACGCTTTGCCGAtAAGCTGCCGTCAGAGCCACGgGaaAATAtCGTTtATcAGTGcTGGGAGCGTtTTTGcCaGGAGCTTGGCAAGCAAATTCCAGTGGCGATGaCTCTGGAAAAGAATatGCCGAtCgGTTCGGGcTTAGGCTcCAGCGCCtGTTCAGTGGTCGCGGCgCTgAtGGCGATgAATGAAcACTGCGGCaAGCCGCTTAATGACACTCGTTTGCTGGCTTtGATGGgCGAgTTGGAAGGGcGTATCTCCGGCAGCAtTCATTACGACAACGtGGCACCGTGtTtTCtTGGTGGTAtGCAGTtgATGATCGAAGAaAACGACATCATCAGCCAGCAaGTGCCAGGGTTTGATGAGtGGCTGTGGGTGCTGGCGTATcCGGgGAtTAAAGTCtCGaCGGcAGAAGCCAGGGCTaTTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCAcGGGCgACATCTgGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATgAAAGaTGTTATCGCTGAACCCTACcGTGaACgGTTaCTGCCAGGCTTCCGGCAGGCGCGGcAGgCGGTTGCGGAAATCGGCGCGGTAgCGAGCGGTATCTCCGGCTCCGGCCCGAcTtTGTTCGCTCTGTGtGAcAAGCCGGATACCGCCCAGCGCGTTGCCGACTGgTTGGGTAAGAACtAcCTGCAAAATCAGgAAGGTTTTGTTcATATTTGCCGGCTGGATACGGCGGGcGCACGAgTACTGGAAAACTAA +threonine synthase 
+ATGAAACTCtacaATCTGAAAGATCACAATGAGCAGgTCaGCTTTGCGCAAGCCGTAACCCAGgGgTTAGGCAAAAATCAGGGgCtGTtTTTTCcgCACgaCCTGCCGGaaTTCAGCcTgACTGAAaTTGATGAGATgCTGAAGCtGGATTTTGTCACcCGCAGTGCGAAGATCCTcTCgGCGTTTATTGGTGATGAAATCCCGCAGGAAaTCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAaGCGATGTCGGTtGTCTGGAaTTGTTCcACGGGCcAACGCTGGCaTTTAAAGATTTCGGcGGTcGCTTTATGGCACAAATGCTgACCcATATTGCGGGCGATAAGCCAGTGAcCATTCTGACCGCGACATCCGGTgATACTGGaGCGGCAGTGGcTCATGcTTTCtACGGTtTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTgTTCTGTACATTGgGCggCAATATCGaAACTGTTGCCATCGAcggCGaTTTCGATGCCTGTCAGGCGCTGGTgAAGCAGGCgTTTGATGATGAAGAACTGAAAGTGgCgCtGGGGCtGAATTCTGCTAAcTCCATCAACaTCAGTCGCTTGCTGGCGcAGATTTGTTaTTAcTTTGaGGCTGTCGCACAGTtGCCGCAAGAAGCACGTAACCAGTTGgTTGTCTCGGTaCCGAGTGgAAACtTcGGCGATtTGACGGcGGGTCTGCTGGCGAaGTcACTCGGTCtGCCGGTAAAACGTtTTATTGCtgCGACCAACGTGAACGAtACCGTACCACGTTTCCTGCaCGaCGGTCAGTGGTCAcCCAAaGCGACTCAGgCGAcgTtaTCCAATGCGATGGATGTTAGCCAGCcAAaCAACTGGCCGCGTGTGGAAGAGTTGtTCcGCCGCAAAATCTGGCAACTGAAAGAGCTGGgTTATGCAGCCGTGgATGATGAAACCACGCAACAGACAATGcGTGAGtTAAaAGAACTGGGCTATACCTCGgAGCCGCACgCTGCCGTAGCTTATCGTGCGCTGCGTGACCAgTTGAAtCCAGGCGAATATGGCTTGTtCCTCGGcACcGCGCATCcGGcGAAatTtAAAgAGAGCGTGGAAGCGATTCTCGGTGAAAcGTTGGatCTGCCAAAAGAGCTGGCAGAACGTGCTgATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAatTgaTGATGAaTCATCAGTAA +hypothetical protein +AtGCAGCCcGGCTtTTTTTATGAAGAAAATaTGGAGaAaAACGACagGGAAAAAGGAGAAATTCtCAATAAATGCGGtAACTTAGAgATTaGGATTGCGGAGAATaACAACTGCcGTTCTCaTCGCGTAATCTCCGGATATCGACCCaTAACGGgCAATGATAAAAGgAGTAACCTGTGA +Non-protein region +aAAAACTgCTGGAAACAATGAAAGAcGTACCGGACGACCAAcGTCAGgCGC +transaldolase B 
+ATGACGGACAAATTGaCCTCcCTTCGTCAGTACACCACCGTAgTGGCCGACACTGGGGACATCGCGGCAATGAAGcTGTaTCAACcGCAGGATGCCACAACCAAcCCTtCTCTCATTCTTAACGCAGCGCAGATTCcGGAATACCGTAAgTTgATTGaTGATGCTGTCGCCTGGGcGAaACaGCAGAGCAAcGATcGCgCgCAGCAgATCGtGGACGCGACCGAcAAACTGGCAGTAaATATTgGTCTgGAAaTCCTGAAACTGgTTCCGgGCCgTATCTCAActGAAGTtGATGCGCGTCTTTCCTATGACaCCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGcAGGTaTTAGCAACGATCgTaTTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGcAGAACAGCTGGAAAAAGAaGGTATTAACTGTAAcCTGACCCTGCTgtTCTCctTCGCtCAGGcTCGTGCTTGTGCGGaAGCGGgCGTgTTCCTGaTCTCGcCGTTTgTTGGCcGTATTCTTGACTGGTAcAAaGCGAATACCGaTAAGAAAGAGtACGCTCcGGCAGAAGATcCGGGCGTGGTTTCTGTatCtGAAATCtACCAGtACTACaAAGAGCATGGTTaTgAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAAcTGGCAGGCTGCGACCGTCTGACCatCGCACCGgcACTGCTGAAAGAGCTGgCGGAGAGCGAAGGGGCTATCgAACGTAAACTgTCTTACAcTGgTGAAGTgAAAGCgCGTCCGGcGCGTATCACtGAGtCCGAGTTCCTgTGgCAgCACAACCAGGATCCAATGGCAGTaGATAAACTgGcGGaAGgTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCtGTAA +molybdopterin biosynthesis mog protein +ATGAATACTTTACGTATTGGCTTaGTtTcCaTCTCTGATCGCGCATCCAGCGGCGTTTAtCAGgaTAAAgGCATCCCTGCGCTGGAagAATGGCTGACAtcGGCGCTAACCACGcCGTTTGAaCTGGAAAcCCgCTTaATCCCCGATGAGCAGGCGATCATCGAGCAaACgTTgTGTGAGCTGGTGGATGAAaTGAGtTGCCaTCTGGTGCTCACCACGGGCGGAAcTGGCCCTGCGCGTCGTGAcgTAACGCcCGATGcGACGCTGGCAGTAGCGGACCGCGAGATgCcAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACcaaCTGCGATCCTTTCGCGTCAGGTggGGGTgATTCGCAAACAGGCGCTGATCCTTAACTTaCcCGGTCAACCGAAGtCTATTAAAGAGACGCtGgAAGGTGtGAAGGACGCTGAGgGTAAcGTTGTGGTGCACGgTATTTTTGCCaGCGTaCcGTaCTGCATTCAGTTGCTGGAAGGGCCATACGTTGAaACGGCaCCgGaAGTGGTTGCAGCATTCAGaCCGAAGAGTGCAaGACGCGAAGtTAGCGAATAA +chaperone protein DnaK 
+aTGGGTAAAATAaTTGGTATCGACcTGGGTACtACCAaCTCTTGTGTagCGaTTAtGGATGGCACCACTCCtCGTGtACTGgAGAACGcCGAAGGCGATCGCACCAcGcCTTcTATCATTgCCTATACCCAGGAtGGTGAAACTCTGGTTgGTCAGCCGGCTAAACGTCAGGCAgtGACGAACCCgCAaAACAcCCTGTtTGCGATTAAACGCCtGATTGGCCGCCgCTTCCAGgACgAAGAAGTACAGCGtGATgTTTcCATCATGCCGTTCAAAATTAtTGcTGCtgatAACGGCGACGcATGGGTCGAAGtTAAAgGCCAGAAAATGGCAcCGCCGcAGAtCTCTGCTGAAGTGCTGAAAAAAAtGAAGAAAACCGCTGAAGaTTAcCTGGgTGAAcCGGTAACTGaAGCTgtTATTACCGTACCGGCAtACTttaACGATGCTCAGCGTCAGGcAACCAAAGaCGCAGGCCGTATCGCTGGTCTGGAAGTAAAaCGTATCATCAACGAaCCGACCGCAGCTGCGCTGGCTtACGGtCTGGACAAAGgTACTGGCAACCgtACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTcCATTATCGAaATCGACGAAGTTGACGGCgAAAAAACCttCGAAGTTCTGGCAACCAACGGTGATACCCACCTGgGTGGtgAAGACTTCGACAGTCGTCTGATCAACTAtCTGGTTGAaGAATTCAAgAAAGATCAGGGCATTGacCtGCGCAACGaTcCGCTGGCAATGCAGCGCCTGAAaGAAGCGGCAGAAAAAGCgAAAATCGAACTGTctTCCGCTCAGcAGACCGaCGTTAACcTGCCGTACATCACTGCAGACGCGAcCGGTCCGAAACACAtGAACATCaAAgTGactCGTGCGAAACTGGAAAGCCTgGtTGAAGAtCTGGTAAACCGtTcCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATAtCGACgaCGTTATTCTCGTTGGTGGTCAGACTCGTATGCcAATGGtTCAGAAGAAAGTTGCTGaATTCTTTGGTAAAgAGCcGCGTAAAGATGTTAACCCGGACGAAGCTGTaGCCATCGgTGCTGCTGTTCAGGGTGGTGTTCTGACTGGtGAcGTAAAAGaCGTacTGCTgCtGGACGTTACCCCGCTGTCtCTGGGTATcGaAACCaTGGGCGGTGTGATGACCACGCTGATCGCgAaAAACACCACTATCCCGACCAaGcAcaGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATcCATgtGCTGcAGGGTGAACgTAaACGTGCgGCTGAtAAcaAATCTCTgggTCAGTTcAACCTGGATGGTATCAaCCCGGCACCGcGCGGCAtgCCGcAGATCGAAGtTACCtTCGAtATCGaTGCTGACGGTATCCTGCaCGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCAcTATCAaGGCTTCTTCTGGtCTGAaCGAAGAtGAAATCCAGAAAATGGTACGCGaCGCAGAAGCTAAcGCCGAAGCTGACCGTAaGTTTGAAGAGCTGGTACAGACtcGCaACCAGGGCGACCATCTGCTGCACAgCACCCGTAAGCAgGTTGAAGAAGCAGGCGACAaACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGActGCACTgGAAACtGCTCTGAAaGGTGAAGaCAAAGcCgCTATcGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCaGCAGCAACATGCcCAGCAGCAGACTGCCGGTGCTgATgCTTCtGCAAaCAAcGCGAAAGaTGACGATGTTGTCGACGCtGAATTTGAAGAAGTCAAAGACAAAAAATAA +chaperone protein DnaJ 
+GTGCatTCatCTAGGGGcAATTTAAAAAAGATGGCTAAGCAAGATTaTTACGAGaTTTTAGGCGTTTCCAAAaCAGCGGAAGAGCGtGAaaTCAAAAaGGCCTACAAACGCCTGGCCATGAAaTACCaCCCGGaCcGTAACCAGGgTGACAAAGaGGCCGAGGCGAAATTTAAAGAGATCAAGGaAGCTTATGAAGTTCTGACCGACtCGCAAAAACgTGCgGCATaCGATCAGTaTGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGcGGtTTTGGCGGCGGCgCAGACTTcAGCGATAtTTtTGGTGACGtTTTCGGCgATATTTTTGGcGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTAcGCTATAACATGGAGctCACcCtCGAAgAAGCTGTACGtgGCGtGaCCAAAGaGATccGCATtCCGACTCtGGAAGAGTGTGACGTTTGCCACgGTAGCgGTGCAAAACCaGGTACACAgCCgCAGACCTGTCCGACcTgTcATGGTTCTGGCCAGGtGCAGATGcGCCAGGGTTTCTTTGcCGTGCAGCAGACCTgTCcAcACTGTCAGGGCCGCGGTACGCTGaTcAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGtTGAGCgCaGCAAAACGCTGTCCGTTAAAATCCCGGCaGGGgTGGACACTGGAGaCCGCATCCGTCTTGCGgGCGAAGGTGAAGCGGGTGAACACGgCGCACCGGCAGGCGATCTgTACGTTCAGGTtCAGGTtAAACaGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGcGAAGTcCCGATCAAcTTCGCTATGgCGGCGcTGGGTGGTgaAATCGAAGTACcGACCcTTGATGGTcGcGTCaaACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAgCTGtTCCgTaTGCGCGGTAAAGGCGTCAAGTCtGTcCGCGGTGGcgCACAGGGTGATTtGCTATGCCGCGTTGTTGTCgaAACAcCGGTAGGTTTGAACgAGAAGCAGAAACAGCTGCTGCAAGaGctGCAAGAAAGCtTTGGTGGcCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCtTCTTtGATGGCGTGAaGAAGTTTTTTGACGaCCTgACTCGCTAA +hypothetical protein +TTGCTCTTaCTCGGATTCgTAAGCCGTGAAAACAGCAaCCTCCGtCTGGCCAGTTCGGATGTGAACCTCACAGAGgTCTTTTCTCGTTACCAgCGCCGCCACTACGGCGGTgATACAGATGACGATCAGgGcgACaAtcAtCgCcTTATGCTGCTTCATTGCTCtCTtCTCCTTGACCTTTCGGTCaGTAAGAgGCACTCTACATGTGTTCTGCATATAGgGGGCCTCGgGTtGATGgTAAAATAtCACTCGGGGCTTTTCTCTAtCTGCCGTTCAGCTAATgCcTGA +hypothetical protein 
+aTGTCTGCCAAaaGACGACTTCTTATTGCGtGTACCTTGAtAaCAGCTATcTATCAtTTTCCTGcaTATTCTTCATTAgAATATAAAGGAtCCTTTGGTTCAATaAATGCGGGTTAtGCAGACTGGAATAGTGGaTTTgTAAaCACTCACCGTGGTGAaGTATGGAAAGTGACtGCGGATTTTGGGgTaAATTTTAAAGAAGCAGAATTTTACTCAtTTTATgAaAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACgGtTTCAGCAATGaCGCATGTCAGACTCtTTGaCtCTGATaTGACATTCTTTGGCAAAATTTaTGgCCAATGGGATAACTCATgGggTGAcGATCTgGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCgAgTGGgGCTTTTtTAAACCGTATATTGGATtGCATAATCAATCTGGTGACTACGTATCAGCTAAATaTgGTCAAACGAATgGTTgGAATGGtTATGTTGTTGGCTGGACAGCAgTATTAcCATTTAcGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGaAATAGAACTGGACAGGaACGATGCTTACACGgAgCAGcAATTTGGCcGGAACGGgTTaAaTGGCGGtTTAACTATTGcCTGGAAGTTCTATCCTCGCTGGAAAGCCAGtGTGACGTGGCGTTATTTcGATAAtAaGCTGGGCTACGATGGCTTTgGcgaTCAAATGATTTAtATGCTTGgTTATGATTTCtAA +putative secreted sulfatase +ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAAtGCTTTTAGtCCTGCCTTAGCCGCAGAGGCTaAACAACcTAATTTAGTCATtaTTATGGCGGaTGATtTAGGTtaTGGCGAtTTAGcAaCaTATGGTCATCAGATCGTTAAAACACctAATATCGACAGGCtTGCCCAgGAAGGGGTCaAATTtACTGAcTaCTATGCCCCCGCTCCTTtAaGTTCAccTtCACGCGCaGGGCTATTAACCGGCcGGATGCCATTtCGTAcTGGAATTCGCTCATGGATtCCttCAGGCAAAGATGTTGCCtTAGGGCGTAACGAAcTCACgATTGCTAaTCTACTCAaAgCGCAaGGGTACGACACggCAATGATGGGTAAGCTGCATCTGAATgCAGGcGGCGaTCGCACCGATCAgCCaCAAGCACaAgATATGGGcTTTGATTAcTCAcTGGTtAATACgGCGGGCTTTGTTACcGACGCCACGCTGGATAAcGCTAAAGAACGCCcGCGTTATGGCATGGTTtAccCGACAGGCtgGCtACGTAACGGGCAACCCACTcCACGaGCTGATAAAAtGAGCGGTGAGTATGTCaGTTCGGAAGTCGTCAACTGGCTGGATAACAAAaaGGACaGCAAGCCTTTCTTCCTCTATgTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAaaATACCTCGATaTGTaCTCACaATATATGAGCGCGTATCAGAAGCAGcATCCTGATTTAtTTTaTGGCGACTGGGcAgACAAACCCTgGCGTgGTGTGGGgGAATATTAtGCCAATATCAGCTATCtGGATGCAcAGGTTGGAAAAgTGCTGGaTAAAATCAAAGCTGTGGgtGaAGaaGaTAACACAATCGTTATTTTTACCAGTGatAACGGTCCgGTAaCGCGTGAAGCGCGCAAAGTGTATgAGCTGAATTTGGCAGGGGAaACGGaTGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGtGTTCCaGCCATTATTAAATaTGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGtCTgGACTGGATGCCTACtTTaGCgAaAATGATGAACTTCAAATTACCTACAGAcCGTAcTTTCGATGgTGAATCGCTGGTTCCTGtTcTTGAGCaAAAAGCATTGAAA
CGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATgATCCAAcCGATGAATGGGCGATCCGTGATGgTGACTGGAAgAtGATTATCGATCGcaATAATAAACcGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAaCaCTTaAtCTGATCGGTAAAAAAACAgATATTGAAAAACAGATGTATGGTaAGtTTtTAAAATATAAAACTGATATTGATaATGATtCTCTAATGAAAgCCAGAGGTGATAAACCAGAAGCGGTGACCTggGGCTAa +putative cytoplasmic protein +ATGTTTACcAacGTAAATGTTGATTGtTgCAAAACACCAGGAtGTAAaaACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCAcAGgGTaAaAATATTTtATGCCGTGAATGTgGTTaCTTGTtTCCAGtGATATCTGAACAGTCGCTTAAtATTTaTCGTAATATTGTGAAtcACTcCTGGAGAGGTTTGATTTGCCAATGTTCAACTtGCGGAGGcACGTCCCTCAAAAAATaTGgATATtCtGCAcAagGCCAgAGAAGAATgTATTGCcaTCAtTGTGaGAAAACaTTtATCACTCTGGAAcAtGTAATTACcACACCACGAGGAGCcCTGTTAGcATTGATGATTGAGCAAGGGGAGGCACTTGCGGaTATCAgAAAGTCATTACGTCTTAACAgCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGcAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGtACCCGCGCTTtTCGcgTCAAGTAtAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGcGGCAGGGTgGTTGcCaTCTCAACCAATTACTCCCCATCtGCCGTAGagCaaCATTATcAATACaCATCGAACtATGAAGAGcGTATGTCTCCAGGGACGCTGGCACAtCATGTCCAGCGCAAAGAGttACTTACTATGCGGCgGGATACCTTGTTTGATATTGATTACGGCcCGgCAGTTTTACATCAAAACGATCCGGGAATGtTGGTAaAaCCGGTTCTTCCGGCATaTCGTCATTTTgAACTGGTCAGAATACTGACCGATGAGCATtCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATaTTGGGCGGCTGcCTGATGGCTAATTTGCAGCaTATTCATCAaGGTCGCTGCCATATTTCcTTTGTCAAaGAGCGcGGTGTGGCACCCGCCACCATTGaTTTTCCACCGCGATtATTCcTTAGTgGtGGgGTACgAAATAATGTCTGGCGTGCaTTTTCTAACCGCAATTATTCAaTGGCTGTATGCAAtCTCaCTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATtGAACAGTGCGACGCgTTtTATCCACTTTGTGgaGAACCATCCTTTCCTTATaTCATTGAACCGAATgtCTCCTGCGaaTGTCgtTTCTACaTTAGATaTCCTCAAACaTCTGTGGAATAaAaAACTAGagCATGGAACAATTtAA +sodium/proton antiporter 1 
+GTGAAACATCTGcATCGATTCTTTAGCaGTGATGCCTCGGGAGgCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTgcAaCCAGTGGATGGTATCACGACTTTCTTGAGACGCcGGTTCAGcTcCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGaCGCTCTGaTgGCGGTATTTTTCCTGTtGGTTGGTcTGGaAGTTAAAcGCGAGcTGaTGCAaGGTTCGCTGGCCAGTCtGCgCCAGGCGGCatTTCCTGTTATTGCCGcAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTtTtAACTATGCCGATCCGaTTaCCCGCGAAGGcTGGGCAatCCCGGCGGCGACTGacATTGCCTTTGCACTTggTgTGTTGGCGCTgTTGGGAAGTCGTGTTCCGTTAGCGCtGAAGATCTTTTtGATGGCTCTGGCtATTATCGACGATCTTgGGGcCATCATtATCATCGCATTGTTCTACAcTAATGACTTATCGATGGCCTcTCTTGGCGTcGCgGCTGTAGCAATTGCGgtACTCGCGGTATTGAAtCTGTgTGGTGTAcGCCGCACGGGCGTtTATATTCTGGTTGGCGTGGTGCtGTGGaCAGCGGTGTTGAAATCGGGGGTTCACGCAACCcTGGCTGGCGtCATtGtCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGgCGCTCTCcGgCTAAACGTCTGGAGCATGTTTTGCAtCCATGGGTGGCGTATCTGATtTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAaGGTgTCACGCtggAaGGTTTgACCtCCATTCTGCCATTAGgGATCATCGCTGGTTTGCTGaTTGGCaAGCCACtGGGTAtTaGTCTgttcTGCTGGtTGGcgCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACgACTtACCAGCAAATTATGGCGGtTGGTaTCcTGTGCGgTATCgGTTtTAcTatGTCTATCTTTATTGCCAGCCTGGcATTTGGTAgCGTAGATcCAGAaCTGaTTAACtGGGCAAAAtTAgGTATCCTTGTCGGTTCAATTTCtTcGgCGGTAATTGGATATAGcTGGTTACGcGTTCGTTTACGTCcATcAGTTTGA +transcriptional activator protein NhaR 
+ATGAGCATGTCTCATaTCAATTACAACCACTtGTATTACTTCTGGCaTGTCTAcAAAgAaGGTTCTGtGGTTGGCgCAGCGGAGGCGCTTTATTTAACAcCAcAAACCATTACCGGGCaGATCCGGGCGCTGGAaGAGCGCCTGCAAGGGAAAcTATTTAAGCGTAAAGGAcgTGGTCTGGAACCCAgcGAACTGGGGGAACTGGTCTATCGCtATGCCGATAAAATGTTCAcCTTAAgCCAGGAAATGCTgGATATCGTCAACTATCGCAAAGAGTCCAACTtATTGtTTGATGTTgGTGTGGCAGATGCACTTtcCAAAcGtcTGGTCAGCAGTGTTCtgGATgCCGCAGTtgTGGAAGACGAGCAGAtCCATCTACGCTGTTTCGAaTCGACGCACGAGATgCTTTTaGAGCAgtTGAGTCAGCATAaACTGGATATGATcaTCTCTGACTGTCCGaTCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAaTtGGCGAATGTGGTGTCAgtTTCTGGTgCACTAACCCACTACcAGAAAAGCCGTTTCCTGCCtGTCTTGAAgAGCgTCGtTtACTTATTCCGGGGCGTCGCTCAaTgTTGGGGCGtAAACTATTAAACTGGTTTAACTCcCAGGGCTTGAACGTCGAAATTTTGgGTGAGTTTGATGATGCTGCGTTGATGAAAgCCTTTGGGGCGAcGCATAACGcTATTTTCGTTGCACCTTCGCtTTACGCTAATgATTTCTATAACgATGACTCGgTtGTGgAGATAGgCCGTGTTGAGaACGTGATGGAAGAGTACCACGCGATTTtTGCCGaAAGgaTGAtTCAgCACCCTGcAGTAcAGCGTATCTGcAATACAgacTATTCTGCGCtgTTTACTCCAGCTTcAAAATAA +riboflavin kinase +ATGAAGCTGATACGCGgCAtACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTaATTTCGACGGCGTGCATCGCggTCATCGCGCGCTGTTACAGGGCtTGCAGGAAGAAGGGCGCAAGCGCAACtTACCGGTGATGGTGATGCTTTTtGaACCTCAACCAcTGGAACTGTTTGCTACTGAtAAAGCcCCGGCACGGcTcACcCGGCTGCgGGAAAAACTGCgTtaTcTTgCAGAgTGTGGCGTTGATTACGTGCTGTGCGtGCGTtTTGaCaGGCGTtTTGCGGCGTTAACCGCGcAAAACTTCATCAgTGATCTtCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGAtTTCCGCTTTggCGCTGgTCGTGAAgGCGAtTTCTtGTTATTACAGAaAGcgGGCATGGAATACGGCTTCGATATcACCAGCaCGCAAAcTTtTTGCGAAGGTGGTGTGCGtATCAGcAGCACCGCCGtgCGTCAGGCGCtTGCGgATgACAATCTGGCTCTGGCAGAAAGTTTACTGGgGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGaATTAGGGCGCAcTATAGGTTTCCCgACGGCGaATGTACCGcTaCgCCGTCAGGTTTCCCCGGTGAAAgGGGTTTATGCGGTAGaAgTgTTGGgCCtTGgCGAAaAGcCGTTAcCCGGcgTTGCAAACaTCGGAACACgCCCAACGGTTGCcGGTATTCGCCAGCAACTGgaAGTGCATTTGTTAGATGTTGcAATGGaCCTTTATGGTCGCCAtATACAAGTAGTGCTGCGtAAAAaAATAcGCAATGAGCAgCGATTTGcATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGcCCGCGaaTTTtTTGGGCTAAcAAAACCGGCTTAa +Isoleucyl-tRNA synthetase 
+ATGAGTGACTATAAATCaACCCTgAATTTGCCgGAAACAGgGTtCCCGATgCGTGGCGATCTCGcCAAGCGCGAAcCGGGaATGCTGGCGCGTTGGACTGATGATGATCTgTaCGGCATCATCCGTGCGGCTaAAAAAGGCAaAaAAACCTTCAtTCTGCATgATGGCCcTCCTTATGCGAATGGCAGCAtTCaTATTGGTcACTCGGTTAACAAGATTCTGAAAGACATTaTCATTaAgTCCAAAgGGCTttCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCaTGGtCTGCCAATCGAAcTGAAAGTAGAGCAAGAATACGGTAAGCCGGGgGAGaAaTTCACCGCCGcTGAGTtCCGCGCCAAGTGCCGCGAATACGCTGCgACCCAGGTTGACGGTCAGCGCAAAGACTTTaTCcGTCTGGGCGTGCTGGGCGActgGTCgcACCCGTACCTGACCATGGACtTCAAAACTGAAGCCAACATCATCCgCGCGCTGGGCAAAATCATCGGCAAcGGTCACCTGCACaAAGGcGCGAAGCCGGTgCACTGGTGCgTTGACTGCCGTTCTgCACTGGCAGAAGCGGAAGtTgAGTATTACGacAAAACTtCTCCGTCCATCGACGTCGCTTtCCAGGCGGTCGATCaGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATgTTAACGGCCCAATTTCGCtGGTTATCTGGaCcACCACGcCGTGgAcGCTGCcTGCTAacCGCgCAATCTCcATtGCACCTGATTTTGAttATGCGCTGGTGCaAatCgACGGTCAGgCCGTGATCCTCGCGAAAGATCtGGtTGaAAGCGTAAtGCAGCGTATCGGCGTTAGCGaTTACACCATTCTTGGCAcGGtgAAAGGTGCCGAGCtGGAACTGTTgCGCTTTACCCATCCGTTtATGGACtTCGATGTTCCGGCAaTTCTCGGCGACcACGTTACgCTGGATGCCGGTACCGGTGcCGTTCATACCGCGCCAGGCcACGGTCCGGaCGACTATgTGATCGGTcAAAAATaTGgTCTGGAAaCCGCTAACCCgGTTgGCcCGGACGgCACtTaTCTGCcGgGTACTTACCCGACTCtGGATgGCGTTaACGTCTTCAAAGCGAACGaTATTGTCATTGCGTTGTTgCAGGAAAAAGGcgCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTgCTGCtGGCGTCaTAAaACGCCGATCAtCTTCCGcgCGACGCCGCAGTGGTTCGTCAgCAtgGATCAGAAAGGTCTGCgTGCGcAGTCACTGAAAGAGATCAAAGGCgTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATcTCTCGTCaGCGTACCTGGGGcGTGCCgATGTCACTGTTCGTgCaCAaaGACACAGAAGAaCTGcATCCGCgTACTCtcGAACTGaTGGAAGAAGTGGcAAAACGCGTTgAAGTtGACgGCATTCAGGCgTGGTGGGATCTCGATGCGAAaGAgATCcTCGGCGaCGAAGCTGACCAGTATGTGAAAGTACCGGATACGCtGgATGTATGGTtTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTcCGGAATtTGCCGGTCACGCAGCGGACATGTaTcTGgAaGGTTCTGACCAACACcGTGgCTGGTtCATGTCtTCCCTGATGATCTCTACCGCGATGAAGGGcAAAGcGCCATATCGTCAGGTACTGACTCACGGCTTTAcCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGtAACaCcGTTTCGCCGCAGGATGTgATGAATAAACtGGGtGCGGATATTCTGCGTCTGTGGGTGGcATCAACCGACTAcACTGGCGAAATGGCcGtTTCTGACGAGATCcTGAAACGtGCTGCcGACAGCTATCGTCGTATCcGTAACAcCgCGCGCTTCCTGCTGGCAAACCTGA
ACgGTTtTGAtCCGGCaAAAGaTATGGTGAAACCGGAAGAGATGGTGGTaCTGGATCGCTGGGCCGtAGGTTGTGCGAAAGCGGCACAGGAAGACATCCtCAAGGCgTACGAAGCATACGATTTCcACGAAGTGGTaCAGCGTcTGaTGCGCtTCTGCTCCGTTGAGATGgGTTccTTCTACCTCGACATCATCAAAGACCGTCAgTATACcGCCAAAGCGGaCAGCGTGGCGCGTCGTAGCTGCCAGAcTgCGCTGTATCACATCGCaGAAGCGCTGGTTCGCTGGATGGCAcCAATCCTCTCCTTCaCcGCTGaTGAAGTGTGGGGtTaCCTGCCggGCGAACGTGAAAAATACGTCTTCAcCGGCgAgTGgTACGAAGGCCTGtTTGGTCTGGCAGACAGTGAAGCAATGAACGaTGCGTTCTGGGACGAGCTGTTGAAAGTGcGTGGCGAAGTGAAcAAAGTcaTTGAGCAAGCgCGTGCCGATAAGAACGTGGGcGGCTCGCTGGAAGCGGCAGTAAcCTTGTATGCAGAACCGGAaCTGGCgGCGAaaCTGaCCGcGCTGGGCGAtGAATTACGATTTGTCCTGtTGACCTCCGgCGCTAcCGTTGcAGACtATAACGACGCACCTGCTGATGCCCAGCAGaGCGAaGTcCTCAAAGGGCTGAAAgtCGCGTTGAGTAAAGCCgAAGGtGaGAAGTGTCCtcGctGCTGgCACTACACCcAGgATGTcGgCAAGGTGGCGGaACACGCAGAAATCTGCGGCCGCTGTgTcAgCaACGTCGCCGGTGACGGTGAAAAaCGTAAGTTTGCCTGA +Non-protein region +GCTTGCGCCAACGcCATTTCATCGCCATCCCGCCgAgcATACAGGCCTCGgAaGAACCAaTGGTGTTGGTGcCAACGGCCtGAccATTTTTcGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGcAGaTTGCGGATATTctTCTTTGTCGATCCAGTTTTTGTtAATGGAtAAAtCCA +FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase +ATGTCTGAATCTGTACAGaGCAaTAgCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGAtGGCaCCAcCGCTGAGTCTACCCGCAaCAaCGGTAaACCGGCGCTGTTCCGCcTGgGTgATGCTTCTCTTTCTgAaGgGCTGGAGCAACACCTGCTgGGGCTGAAAGTGGgCGATAAAACCaCCTTCtCGCTGGAGCCAGATGCGGCgTTtgGCGTGCCGTcACCgGAcCTGATtCAGTAcTTCTCcCGCCGTGAATTTATGgATGCAGGCGAGCcaGAAATTGGCGCAATCATgCTTTTTACCGCAATGGaTGGCAGTGAGATGCCTGGCGTGaTCCGCgAAATTAACGGCGACTCCATTACCGTTGATTTCAACCaTCCGCTgGCCGGGCAGACCGTTCATTTTGATATTGaagTGCTGGaAATCGATCCGGCAcTGGAGGcGTaA diff --git a/dna/spec/ecoli_console.txt b/dna/spec/ecoli_console.txt new file mode 100644 index 0000000..e509eb1 --- /dev/null +++ b/dna/spec/ecoli_console.txt @@ -0,0 +1,5 @@ +This program reports information about DNA +nucleotide sequences that may encode proteins. + +Input file name? ecoli.txt +Output file name? 
ecoli_file.txt diff --git a/dna/spec/ecoli_file.txt b/dna/spec/ecoli_file.txt new file mode 100644 index 0000000..449f06f --- /dev/null +++ b/dna/spec/ecoli_file.txt @@ -0,0 +1,140 @@ +Region Name: thr operon leader peptide +Nucleotides: ATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGA +Nuc. Counts: [21, 22, 12, 11] +Total Mass%: [33.5, 28.9, 21.4, 16.2] of 8471.7 +Codons List: [ATG, AAA, CGC, ATT, AGC, ACC, ACC, ATT, ACC, ACC, ACC, ATC, ACC, ATT, ACC, ACA, GGT, AAC, GGT, GCG, GGC, TGA] +Is Protein?: YES + +Region Name: aspartokinase I/homoserine dehydrogenase I +Nucleotides: ATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGGGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCATCTGGTAGCGATGATTGAAAAAACCATTAGCGGTCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTCTGACGGGACTCGCCGCCGCCCAGCCGGGATTTCCGCTGGCACAATTGAAAACTTTCGTCGACCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATCAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCATTATGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGGTCGAAAAACTGCTGGCAGTGGGTCATTACCTCGAATCTACCGTTGATATTGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCGGCTGACCACATGGTGCTGATGGCTGGTTTCACTGCCGGTAATGAAAAAGGCGAGCTGGTGGTTCTGGGACGCAACGGTTCCGACTACTCCGCTGCGGTGCTGGCGGCCTGTTTACGCGCCGATTGTTGCGAGATCTGGACGGATGTTGACGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGGAAGCGATGGAGCTTTCTTACTTCGGCGCTAAAGTTCTTCACCCCCGCACCATTACCCCCATCGCCCAGTTCCAGATCCCTTGCCTGATTAAAAATACCGGAAATCCCCAAGCACCAGGTACGCTCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATCTGAATAACATGGCAATGTTCAGCGTTTCCGGCCCGGGGATGAAAGGGATGGTTGGCATGGCGGCGCGCGTCTTTGCAGCGATGTCACGCGCCCGTATTTCCGTGGTGCTGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCAAAGCGACTGTGTGCGAGCTGAACGGGCAATGCAGGAAGAGTTCTACCTGGAACTGAAAGAAGGCTTACTGGAGCCGTTGGCGGTGACGGAACGGCTGGCCATTATCTCGGTGGTAGGTGATGGTATGCGCACCTTACGTGGGATCTCGGCGAAATTCTTTGCCGCGCTGGCCCGCGCCAATATCAACATTGTCGCCATTGCTCAGGGATCTTCTGAACGCTCAATCTCTGTCGTGGTCAATAACGATGATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCG
AAGTGTTTGTGATTGGCGTCGGTGGCGTTGGCGGTGCGCTGCTGGAGCAACTGAAGCGTCAGCAAAGCTGGTTGAAGAATAAACATATCGACTTACGTGTCTGCGGTGTTGCTAACTCGAAGGCACTGCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGGAAGAACTGGCGCAAGCCAAAGAGCCGTTTAATCTCGGGCGCTTAATTCGCCTCGTGAAAGAATATCATCTGCTGAACCCGGTCATTGTTGACTGTACTTCCAGCCAGGCTGTGGCAGATCAATATGCCGACTTCCTGCGCGAAGGTTTCCACGTTGTTACGCCGAACAAAAAGGCCAACACCTCGTCGATGGATTACTACCATCAGTTGCGTTATGCGGCGGAAAAATCGCGGCGTAAATTCCTCTATGACACCAACGTTGGGGCTGGATTACCGGTTATTGAGAACCTGCAAAATCTGCTCAATGCTGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTATATCTTCGGCAAGTTAGACGAAGGCATGAGTTTCTCCGAGGCGACCACACTGGCGCGGGAAATGGGTTATACCGAACCGGACCCGCGAGATGATCTTTCTGGTATGGATGTGGCGCGTAAGCTATTGATTCTCGCTCGTGAAACGGGACGTGAACTGGAGCTGGCGGATATTGAAATTGAACCTGTGCTGCCCGCAGAGTTTAACGCCGAGGGTGATGTCGCCGCTTTTATGGCGAATCTGTCACAGCTCGACGATCTCTTTGCCGCGCGTGTGGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATATTGATGAAGATGGCGTCTGCCGCGTGAAGATTGCCGAAGTGGATGGTAATGATCCGCTGTTCAAAGTGAAAAATGGCGAAAACGCCCTGGCCTTCTATAGCCACTATTATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCAATGACGTTACAGCTGCCGGTGTCTTTGCTGATCTGCTACGTACCCTCTCATGGAAGTTAGGAGTCTGA +Nuc. 
Counts: [551, 608, 692, 612] +Total Mass%: [23.0, 20.9, 32.4, 23.7] of 323152.2 +Codons List: [ATG, CGA, GTG, TTG, AAG, TTC, GGC, GGT, ACA, TCA, GTG, GCA, AAT, GCA, GAA, CGT, TTT, CTG, CGG, GTT, GCC, GAT, ATT, CTG, GAA, AGC, AAT, GCC, AGG, CAG, GGG, CAG, GTG, GCC, ACC, GTC, CTC, TCT, GCC, CCC, GCC, AAA, ATC, ACC, AAC, CAT, CTG, GTA, GCG, ATG, ATT, GAA, AAA, ACC, ATT, AGC, GGT, CAG, GAT, GCT, TTA, CCC, AAT, ATC, AGC, GAT, GCC, GAA, CGT, ATT, TTT, GCC, GAA, CTT, CTG, ACG, GGA, CTC, GCC, GCC, GCC, CAG, CCG, GGA, TTT, CCG, CTG, GCA, CAA, TTG, AAA, ACT, TTC, GTC, GAC, CAG, GAA, TTT, GCC, CAA, ATA, AAA, CAT, GTC, CTG, CAT, GGC, ATC, AGT, TTG, TTG, GGG, CAG, TGC, CCG, GAT, AGC, ATC, AAC, GCT, GCG, CTG, ATT, TGC, CGT, GGC, GAG, AAA, ATG, TCG, ATC, GCC, ATT, ATG, GCC, GGC, GTG, TTA, GAA, GCG, CGT, GGT, CAC, AAC, GTT, ACC, GTT, ATC, GAT, CCG, GTC, GAA, AAA, CTG, CTG, GCA, GTG, GGT, CAT, TAC, CTC, GAA, TCT, ACC, GTT, GAT, ATT, GCT, GAA, TCC, ACC, CGC, CGT, ATT, GCG, GCA, AGC, CGC, ATT, CCG, GCT, GAC, CAC, ATG, GTG, CTG, ATG, GCT, GGT, TTC, ACT, GCC, GGT, AAT, GAA, AAA, GGC, GAG, CTG, GTG, GTT, CTG, GGA, CGC, AAC, GGT, TCC, GAC, TAC, TCC, GCT, GCG, GTG, CTG, GCG, GCC, TGT, TTA, CGC, GCC, GAT, TGT, TGC, GAG, ATC, TGG, ACG, GAT, GTT, GAC, GGT, GTT, TAT, ACC, TGC, GAT, CCG, CGT, CAG, GTG, CCC, GAT, GCG, AGG, TTG, TTG, AAG, TCG, ATG, TCC, TAT, CAG, GAA, GCG, ATG, GAG, CTT, TCT, TAC, TTC, GGC, GCT, AAA, GTT, CTT, CAC, CCC, CGC, ACC, ATT, ACC, CCC, ATC, GCC, CAG, TTC, CAG, ATC, CCT, TGC, CTG, ATT, AAA, AAT, ACC, GGA, AAT, CCC, CAA, GCA, CCA, GGT, ACG, CTC, ATT, GGT, GCC, AGC, CGT, GAT, GAA, GAC, GAA, TTA, CCG, GTC, AAG, GGC, ATT, TCC, AAT, CTG, AAT, AAC, ATG, GCA, ATG, TTC, AGC, GTT, TCC, GGC, CCG, GGG, ATG, AAA, GGG, ATG, GTT, GGC, ATG, GCG, GCG, CGC, GTC, TTT, GCA, GCG, ATG, TCA, CGC, GCC, CGT, ATT, TCC, GTG, GTG, CTG, ATT, ACG, CAA, TCA, TCT, TCC, GAA, TAC, AGT, ATC, AGT, TTC, TGC, GTT, CCG, CAA, AGC, GAC, TGT, GTG, CGA, GCT, GAA, CGG, GCA, ATG, CAG, GAA, GAG, TTC, TAC, CTG, GAA, 
CTG, AAA, GAA, GGC, TTA, CTG, GAG, CCG, TTG, GCG, GTG, ACG, GAA, CGG, CTG, GCC, ATT, ATC, TCG, GTG, GTA, GGT, GAT, GGT, ATG, CGC, ACC, TTA, CGT, GGG, ATC, TCG, GCG, AAA, TTC, TTT, GCC, GCG, CTG, GCC, CGC, GCC, AAT, ATC, AAC, ATT, GTC, GCC, ATT, GCT, CAG, GGA, TCT, TCT, GAA, CGC, TCA, ATC, TCT, GTC, GTG, GTC, AAT, AAC, GAT, GAT, GCG, ACC, ACT, GGC, GTG, CGC, GTT, ACT, CAT, CAG, ATG, CTG, TTC, AAT, ACC, GAT, CAG, GTT, ATC, GAA, GTG, TTT, GTG, ATT, GGC, GTC, GGT, GGC, GTT, GGC, GGT, GCG, CTG, CTG, GAG, CAA, CTG, AAG, CGT, CAG, CAA, AGC, TGG, TTG, AAG, AAT, AAA, CAT, ATC, GAC, TTA, CGT, GTC, TGC, GGT, GTT, GCT, AAC, TCG, AAG, GCA, CTG, CTC, ACC, AAT, GTA, CAT, GGC, CTT, AAT, CTG, GAA, AAC, TGG, CAG, GAA, GAA, CTG, GCG, CAA, GCC, AAA, GAG, CCG, TTT, AAT, CTC, GGG, CGC, TTA, ATT, CGC, CTC, GTG, AAA, GAA, TAT, CAT, CTG, CTG, AAC, CCG, GTC, ATT, GTT, GAC, TGT, ACT, TCC, AGC, CAG, GCT, GTG, GCA, GAT, CAA, TAT, GCC, GAC, TTC, CTG, CGC, GAA, GGT, TTC, CAC, GTT, GTT, ACG, CCG, AAC, AAA, AAG, GCC, AAC, ACC, TCG, TCG, ATG, GAT, TAC, TAC, CAT, CAG, TTG, CGT, TAT, GCG, GCG, GAA, AAA, TCG, CGG, CGT, AAA, TTC, CTC, TAT, GAC, ACC, AAC, GTT, GGG, GCT, GGA, TTA, CCG, GTT, ATT, GAG, AAC, CTG, CAA, AAT, CTG, CTC, AAT, GCT, GGT, GAT, GAA, TTG, ATG, AAG, TTC, TCC, GGC, ATT, CTT, TCA, GGT, TCG, CTT, TCT, TAT, ATC, TTC, GGC, AAG, TTA, GAC, GAA, GGC, ATG, AGT, TTC, TCC, GAG, GCG, ACC, ACA, CTG, GCG, CGG, GAA, ATG, GGT, TAT, ACC, GAA, CCG, GAC, CCG, CGA, GAT, GAT, CTT, TCT, GGT, ATG, GAT, GTG, GCG, CGT, AAG, CTA, TTG, ATT, CTC, GCT, CGT, GAA, ACG, GGA, CGT, GAA, CTG, GAG, CTG, GCG, GAT, ATT, GAA, ATT, GAA, CCT, GTG, CTG, CCC, GCA, GAG, TTT, AAC, GCC, GAG, GGT, GAT, GTC, GCC, GCT, TTT, ATG, GCG, AAT, CTG, TCA, CAG, CTC, GAC, GAT, CTC, TTT, GCC, GCG, CGT, GTG, GCG, AAG, GCC, CGT, GAT, GAA, GGA, AAA, GTT, TTG, CGC, TAT, GTT, GGC, AAT, ATT, GAT, GAA, GAT, GGC, GTC, TGC, CGC, GTG, AAG, ATT, GCC, GAA, GTG, GAT, GGT, AAT, GAT, CCG, CTG, TTC, AAA, GTG, AAA, AAT, GGC, GAA, AAC, GCC, CTG, GCC, TTC, TAT, 
AGC, CAC, TAT, TAT, CAG, CCG, CTG, CCG, TTG, GTA, CTG, CGC, GGA, TAT, GGT, GCG, GGC, AAT, GAC, GTT, ACA, GCT, GCC, GGT, GTC, TTT, GCT, GAT, CTG, CTA, CGT, ACC, CTC, TCA, TGG, AAG, TTA, GGA, GTC, TGA] +Is Protein?: YES + +Region Name: homoserine kinase +Nucleotides: ATGGTTAAAGTTTATGCCCCGGCTTCCAGTGCCAATATGAGCGTCGGGTTTGATGTGCTCGGGGCGGCGGTGACACCTGTTGATGGTGCATTGCTCGGAGATGTAGTCACGGTTGAGGCGGCAGAGACATTCAGTCTCAACAACCTCGGACGCTTTGCCGATAAGCTGCCGTCAGAGCCACGGGAAAATATCGTTTATCAGTGCTGGGAGCGTTTTTGCCAGGAGCTTGGCAAGCAAATTCCAGTGGCGATGACTCTGGAAAAGAATATGCCGATCGGTTCGGGCTTAGGCTCCAGCGCCTGTTCAGTGGTCGCGGCGCTGATGGCGATGAATGAACACTGCGGCAAGCCGCTTAATGACACTCGTTTGCTGGCTTTGATGGGCGAGTTGGAAGGGCGTATCTCCGGCAGCATTCATTACGACAACGTGGCACCGTGTTTTCTTGGTGGTATGCAGTTGATGATCGAAGAAAACGACATCATCAGCCAGCAAGTGCCAGGGTTTGATGAGTGGCTGTGGGTGCTGGCGTATCCGGGGATTAAAGTCTCGACGGCAGAAGCCAGGGCTATTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCACGGGCGACATCTGGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATGAAAGATGTTATCGCTGAACCCTACCGTGAACGGTTACTGCCAGGCTTCCGGCAGGCGCGGCAGGCGGTTGCGGAAATCGGCGCGGTAGCGAGCGGTATCTCCGGCTCCGGCCCGACTTTGTTCGCTCTGTGTGACAAGCCGGATACCGCCCAGCGCGTTGCCGACTGGTTGGGTAAGAACTACCTGCAAAATCAGGAAGGTTTTGTTCATATTTGCCGGCTGGATACGGCGGGCGCACGAGTACTGGAAAACTAA +Nuc. 
Counts: [193, 226, 295, 219] +Total Mass%: [21.2, 20.4, 36.2, 22.2] of 123170.2 +Codons List: [ATG, GTT, AAA, GTT, TAT, GCC, CCG, GCT, TCC, AGT, GCC, AAT, ATG, AGC, GTC, GGG, TTT, GAT, GTG, CTC, GGG, GCG, GCG, GTG, ACA, CCT, GTT, GAT, GGT, GCA, TTG, CTC, GGA, GAT, GTA, GTC, ACG, GTT, GAG, GCG, GCA, GAG, ACA, TTC, AGT, CTC, AAC, AAC, CTC, GGA, CGC, TTT, GCC, GAT, AAG, CTG, CCG, TCA, GAG, CCA, CGG, GAA, AAT, ATC, GTT, TAT, CAG, TGC, TGG, GAG, CGT, TTT, TGC, CAG, GAG, CTT, GGC, AAG, CAA, ATT, CCA, GTG, GCG, ATG, ACT, CTG, GAA, AAG, AAT, ATG, CCG, ATC, GGT, TCG, GGC, TTA, GGC, TCC, AGC, GCC, TGT, TCA, GTG, GTC, GCG, GCG, CTG, ATG, GCG, ATG, AAT, GAA, CAC, TGC, GGC, AAG, CCG, CTT, AAT, GAC, ACT, CGT, TTG, CTG, GCT, TTG, ATG, GGC, GAG, TTG, GAA, GGG, CGT, ATC, TCC, GGC, AGC, ATT, CAT, TAC, GAC, AAC, GTG, GCA, CCG, TGT, TTT, CTT, GGT, GGT, ATG, CAG, TTG, ATG, ATC, GAA, GAA, AAC, GAC, ATC, ATC, AGC, CAG, CAA, GTG, CCA, GGG, TTT, GAT, GAG, TGG, CTG, TGG, GTG, CTG, GCG, TAT, CCG, GGG, ATT, AAA, GTC, TCG, ACG, GCA, GAA, GCC, AGG, GCT, ATT, TTA, CCG, GCG, CAG, TAT, CGC, CGC, CAG, GAT, TGC, ATT, GCG, CAC, GGG, CGA, CAT, CTG, GCA, GGC, TTC, ATT, CAC, GCC, TGC, TAT, TCC, CGT, CAG, CTT, GAG, CTT, GCC, GCG, AAG, CTG, ATG, AAA, GAT, GTT, ATC, GCT, GAA, CCC, TAC, CGT, GAA, CGG, TTA, CTG, CCA, GGC, TTC, CGG, CAG, GCG, CGG, CAG, GCG, GTT, GCG, GAA, ATC, GGC, GCG, GTA, GCG, AGC, GGT, ATC, TCC, GGC, TCC, GGC, CCG, ACT, TTG, TTC, GCT, CTG, TGT, GAC, AAG, CCG, GAT, ACC, GCC, CAG, CGC, GTT, GCC, GAC, TGG, TTG, GGT, AAG, AAC, TAC, CTG, CAA, AAT, CAG, GAA, GGT, TTT, GTT, CAT, ATT, TGC, CGG, CTG, GAT, ACG, GCG, GGC, GCA, CGA, GTA, CTG, GAA, AAC, TAA] +Is Protein?: YES + +Region Name: threonine synthase +Nucleotides: 
ATGAAACTCTACAATCTGAAAGATCACAATGAGCAGGTCAGCTTTGCGCAAGCCGTAACCCAGGGGTTAGGCAAAAATCAGGGGCTGTTTTTTCCGCACGACCTGCCGGAATTCAGCCTGACTGAAATTGATGAGATGCTGAAGCTGGATTTTGTCACCCGCAGTGCGAAGATCCTCTCGGCGTTTATTGGTGATGAAATCCCGCAGGAAATCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAAGCGATGTCGGTTGTCTGGAATTGTTCCACGGGCCAACGCTGGCATTTAAAGATTTCGGCGGTCGCTTTATGGCACAAATGCTGACCCATATTGCGGGCGATAAGCCAGTGACCATTCTGACCGCGACATCCGGTGATACTGGAGCGGCAGTGGCTCATGCTTTCTACGGTTTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTGTTCTGTACATTGGGCGGCAATATCGAAACTGTTGCCATCGACGGCGATTTCGATGCCTGTCAGGCGCTGGTGAAGCAGGCGTTTGATGATGAAGAACTGAAAGTGGCGCTGGGGCTGAATTCTGCTAACTCCATCAACATCAGTCGCTTGCTGGCGCAGATTTGTTATTACTTTGAGGCTGTCGCACAGTTGCCGCAAGAAGCACGTAACCAGTTGGTTGTCTCGGTACCGAGTGGAAACTTCGGCGATTTGACGGCGGGTCTGCTGGCGAAGTCACTCGGTCTGCCGGTAAAACGTTTTATTGCTGCGACCAACGTGAACGATACCGTACCACGTTTCCTGCACGACGGTCAGTGGTCACCCAAAGCGACTCAGGCGACGTTATCCAATGCGATGGATGTTAGCCAGCCAAACAACTGGCCGCGTGTGGAAGAGTTGTTCCGCCGCAAAATCTGGCAACTGAAAGAGCTGGGTTATGCAGCCGTGGATGATGAAACCACGCAACAGACAATGCGTGAGTTAAAAGAACTGGGCTATACCTCGGAGCCGCACGCTGCCGTAGCTTATCGTGCGCTGCGTGACCAGTTGAATCCAGGCGAATATGGCTTGTTCCTCGGCACCGCGCATCCGGCGAAATTTAAAGAGAGCGTGGAAGCGATTCTCGGTGAAACGTTGGATCTGCCAAAAGAGCTGGCAGAACGTGCTGATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAATTGATGATGAATCATCAGTAA +Nuc. 
Counts: [309, 311, 358, 309] +Total Mass%: [24.7, 20.4, 32.0, 22.9] of 169069.5 +Codons List: [ATG, AAA, CTC, TAC, AAT, CTG, AAA, GAT, CAC, AAT, GAG, CAG, GTC, AGC, TTT, GCG, CAA, GCC, GTA, ACC, CAG, GGG, TTA, GGC, AAA, AAT, CAG, GGG, CTG, TTT, TTT, CCG, CAC, GAC, CTG, CCG, GAA, TTC, AGC, CTG, ACT, GAA, ATT, GAT, GAG, ATG, CTG, AAG, CTG, GAT, TTT, GTC, ACC, CGC, AGT, GCG, AAG, ATC, CTC, TCG, GCG, TTT, ATT, GGT, GAT, GAA, ATC, CCG, CAG, GAA, ATC, CTG, GAA, GAG, CGC, GTA, CGT, GCG, GCG, TTT, GCC, TTC, CCG, GCT, CCG, GTC, GCC, AAT, GTT, GAA, AGC, GAT, GTC, GGT, TGT, CTG, GAA, TTG, TTC, CAC, GGG, CCA, ACG, CTG, GCA, TTT, AAA, GAT, TTC, GGC, GGT, CGC, TTT, ATG, GCA, CAA, ATG, CTG, ACC, CAT, ATT, GCG, GGC, GAT, AAG, CCA, GTG, ACC, ATT, CTG, ACC, GCG, ACA, TCC, GGT, GAT, ACT, GGA, GCG, GCA, GTG, GCT, CAT, GCT, TTC, TAC, GGT, TTA, CCG, AAT, GTG, AAA, GTG, GTT, ATC, CTC, TAT, CCA, CGA, GGC, AAA, ATC, AGT, CCA, CTG, CAA, GAA, AAA, CTG, TTC, TGT, ACA, TTG, GGC, GGC, AAT, ATC, GAA, ACT, GTT, GCC, ATC, GAC, GGC, GAT, TTC, GAT, GCC, TGT, CAG, GCG, CTG, GTG, AAG, CAG, GCG, TTT, GAT, GAT, GAA, GAA, CTG, AAA, GTG, GCG, CTG, GGG, CTG, AAT, TCT, GCT, AAC, TCC, ATC, AAC, ATC, AGT, CGC, TTG, CTG, GCG, CAG, ATT, TGT, TAT, TAC, TTT, GAG, GCT, GTC, GCA, CAG, TTG, CCG, CAA, GAA, GCA, CGT, AAC, CAG, TTG, GTT, GTC, TCG, GTA, CCG, AGT, GGA, AAC, TTC, GGC, GAT, TTG, ACG, GCG, GGT, CTG, CTG, GCG, AAG, TCA, CTC, GGT, CTG, CCG, GTA, AAA, CGT, TTT, ATT, GCT, GCG, ACC, AAC, GTG, AAC, GAT, ACC, GTA, CCA, CGT, TTC, CTG, CAC, GAC, GGT, CAG, TGG, TCA, CCC, AAA, GCG, ACT, CAG, GCG, ACG, TTA, TCC, AAT, GCG, ATG, GAT, GTT, AGC, CAG, CCA, AAC, AAC, TGG, CCG, CGT, GTG, GAA, GAG, TTG, TTC, CGC, CGC, AAA, ATC, TGG, CAA, CTG, AAA, GAG, CTG, GGT, TAT, GCA, GCC, GTG, GAT, GAT, GAA, ACC, ACG, CAA, CAG, ACA, ATG, CGT, GAG, TTA, AAA, GAA, CTG, GGC, TAT, ACC, TCG, GAG, CCG, CAC, GCT, GCC, GTA, GCT, TAT, CGT, GCG, CTG, CGT, GAC, CAG, TTG, AAT, CCA, GGC, GAA, TAT, GGC, TTG, TTC, CTC, GGC, ACC, GCG, CAT, CCG, GCG, AAA, 
TTT, AAA, GAG, AGC, GTG, GAA, GCG, ATT, CTC, GGT, GAA, ACG, TTG, GAT, CTG, CCA, AAA, GAG, CTG, GCA, GAA, CGT, GCT, GAT, TTA, CCC, TTG, CTT, TCG, CAT, AAC, CTG, CCC, GCC, GAT, TTT, GCT, GCG, TTG, CGT, AAA, TTG, ATG, ATG, AAT, CAT, CAG, TAA] +Is Protein?: YES + +Region Name: hypothetical protein +Nucleotides: ATGCAGCCCGGCTTTTTTTATGAAGAAAATATGGAGAAAAACGACAGGGAAAAAGGAGAAATTCTCAATAAATGCGGTAACTTAGAGATTAGGATTGCGGAGAATAACAACTGCCGTTCTCATCGCGTAATCTCCGGATATCGACCCATAACGGGCAATGATAAAAGGAGTAACCTGTGA +Nuc. Counts: [66, 31, 43, 40] +Total Mass%: [37.4, 14.4, 27.2, 21.0] of 23865.4 +Codons List: [ATG, CAG, CCC, GGC, TTT, TTT, TAT, GAA, GAA, AAT, ATG, GAG, AAA, AAC, GAC, AGG, GAA, AAA, GGA, GAA, ATT, CTC, AAT, AAA, TGC, GGT, AAC, TTA, GAG, ATT, AGG, ATT, GCG, GAG, AAT, AAC, AAC, TGC, CGT, TCT, CAT, CGC, GTA, ATC, TCC, GGA, TAT, CGA, CCC, ATA, ACG, GGC, AAT, GAT, AAA, AGG, AGT, AAC, CTG, TGA] +Is Protein?: YES + +Region Name: Non-protein region +Nucleotides: AAAAACTGCTGGAAACAATGAAAGACGTACCGGACGACCAACGTCAGGCGC +Nuc. 
Counts: [20, 13, 13, 5] +Total Mass%: [40.1, 21.4, 29.2, 9.3] of 6737.1 +Codons List: [AAA, AAC, TGC, TGG, AAA, CAA, TGA, AAG, ACG, TAC, CGG, ACG, ACC, AAC, GTC, AGG, CGC] +Is Protein?: NO + +Region Name: transaldolase B +Nucleotides: ATGACGGACAAATTGACCTCCCTTCGTCAGTACACCACCGTAGTGGCCGACACTGGGGACATCGCGGCAATGAAGCTGTATCAACCGCAGGATGCCACAACCAACCCTTCTCTCATTCTTAACGCAGCGCAGATTCCGGAATACCGTAAGTTGATTGATGATGCTGTCGCCTGGGCGAAACAGCAGAGCAACGATCGCGCGCAGCAGATCGTGGACGCGACCGACAAACTGGCAGTAAATATTGGTCTGGAAATCCTGAAACTGGTTCCGGGCCGTATCTCAACTGAAGTTGATGCGCGTCTTTCCTATGACACCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGCAGGTATTAGCAACGATCGTATTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGCAGAACAGCTGGAAAAAGAAGGTATTAACTGTAACCTGACCCTGCTGTTCTCCTTCGCTCAGGCTCGTGCTTGTGCGGAAGCGGGCGTGTTCCTGATCTCGCCGTTTGTTGGCCGTATTCTTGACTGGTACAAAGCGAATACCGATAAGAAAGAGTACGCTCCGGCAGAAGATCCGGGCGTGGTTTCTGTATCTGAAATCTACCAGTACTACAAAGAGCATGGTTATGAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAACTGGCAGGCTGCGACCGTCTGACCATCGCACCGGCACTGCTGAAAGAGCTGGCGGAGAGCGAAGGGGCTATCGAACGTAAACTGTCTTACACTGGTGAAGTGAAAGCGCGTCCGGCGCGTATCACTGAGTCCGAGTTCCTGTGGCAGCACAACCAGGATCCAATGGCAGTAGATAAACTGGCGGAAGGTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCTGTAA +Nuc. 
Counts: [252, 236, 256, 210] +Total Mass%: [27.2, 20.9, 30.9, 21.0] of 125233.8 +Codons List: [ATG, ACG, GAC, AAA, TTG, ACC, TCC, CTT, CGT, CAG, TAC, ACC, ACC, GTA, GTG, GCC, GAC, ACT, GGG, GAC, ATC, GCG, GCA, ATG, AAG, CTG, TAT, CAA, CCG, CAG, GAT, GCC, ACA, ACC, AAC, CCT, TCT, CTC, ATT, CTT, AAC, GCA, GCG, CAG, ATT, CCG, GAA, TAC, CGT, AAG, TTG, ATT, GAT, GAT, GCT, GTC, GCC, TGG, GCG, AAA, CAG, CAG, AGC, AAC, GAT, CGC, GCG, CAG, CAG, ATC, GTG, GAC, GCG, ACC, GAC, AAA, CTG, GCA, GTA, AAT, ATT, GGT, CTG, GAA, ATC, CTG, AAA, CTG, GTT, CCG, GGC, CGT, ATC, TCA, ACT, GAA, GTT, GAT, GCG, CGT, CTT, TCC, TAT, GAC, ACC, GAA, GCG, TCA, ATT, GCG, AAA, GCA, AAA, CGC, CTG, ATC, AAA, CTC, TAC, AAC, GAT, GCA, GGT, ATT, AGC, AAC, GAT, CGT, ATT, CTG, ATC, AAA, CTG, GCT, TCT, ACC, TGG, CAG, GGT, ATC, CGT, GCT, GCA, GAA, CAG, CTG, GAA, AAA, GAA, GGT, ATT, AAC, TGT, AAC, CTG, ACC, CTG, CTG, TTC, TCC, TTC, GCT, CAG, GCT, CGT, GCT, TGT, GCG, GAA, GCG, GGC, GTG, TTC, CTG, ATC, TCG, CCG, TTT, GTT, GGC, CGT, ATT, CTT, GAC, TGG, TAC, AAA, GCG, AAT, ACC, GAT, AAG, AAA, GAG, TAC, GCT, CCG, GCA, GAA, GAT, CCG, GGC, GTG, GTT, TCT, GTA, TCT, GAA, ATC, TAC, CAG, TAC, TAC, AAA, GAG, CAT, GGT, TAT, GAA, ACC, GTG, GTT, ATG, GGC, GCA, AGC, TTC, CGT, AAC, ATC, GGC, GAA, ATT, CTG, GAA, CTG, GCA, GGC, TGC, GAC, CGT, CTG, ACC, ATC, GCA, CCG, GCA, CTG, CTG, AAA, GAG, CTG, GCG, GAG, AGC, GAA, GGG, GCT, ATC, GAA, CGT, AAA, CTG, TCT, TAC, ACT, GGT, GAA, GTG, AAA, GCG, CGT, CCG, GCG, CGT, ATC, ACT, GAG, TCC, GAG, TTC, CTG, TGG, CAG, CAC, AAC, CAG, GAT, CCA, ATG, GCA, GTA, GAT, AAA, CTG, GCG, GAA, GGT, ATC, CGT, AAG, TTT, GCT, GTT, GAC, CAG, GAA, AAA, CTG, GAA, AAA, ATG, ATC, GGC, GAT, CTG, CTG, TAA] +Is Protein?: YES + +Region Name: molybdopterin biosynthesis mog protein +Nucleotides: 
ATGAATACTTTACGTATTGGCTTAGTTTCCATCTCTGATCGCGCATCCAGCGGCGTTTATCAGGATAAAGGCATCCCTGCGCTGGAAGAATGGCTGACATCGGCGCTAACCACGCCGTTTGAACTGGAAACCCGCTTAATCCCCGATGAGCAGGCGATCATCGAGCAAACGTTGTGTGAGCTGGTGGATGAAATGAGTTGCCATCTGGTGCTCACCACGGGCGGAACTGGCCCTGCGCGTCGTGACGTAACGCCCGATGCGACGCTGGCAGTAGCGGACCGCGAGATGCCAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACCAACTGCGATCCTTTCGCGTCAGGTGGGGGTGATTCGCAAACAGGCGCTGATCCTTAACTTACCCGGTCAACCGAAGTCTATTAAAGAGACGCTGGAAGGTGTGAAGGACGCTGAGGGTAACGTTGTGGTGCACGGTATTTTTGCCAGCGTACCGTACTGCATTCAGTTGCTGGAAGGGCCATACGTTGAAACGGCACCGGAAGTGGTTGCAGCATTCAGACCGAAGAGTGCAAGACGCGAAGTTAGCGAATAA +Nuc. Counts: [139, 143, 175, 131] +Total Mass%: [24.2, 20.5, 34.1, 21.1] of 77506.9 +Codons List: [ATG, AAT, ACT, TTA, CGT, ATT, GGC, TTA, GTT, TCC, ATC, TCT, GAT, CGC, GCA, TCC, AGC, GGC, GTT, TAT, CAG, GAT, AAA, GGC, ATC, CCT, GCG, CTG, GAA, GAA, TGG, CTG, ACA, TCG, GCG, CTA, ACC, ACG, CCG, TTT, GAA, CTG, GAA, ACC, CGC, TTA, ATC, CCC, GAT, GAG, CAG, GCG, ATC, ATC, GAG, CAA, ACG, TTG, TGT, GAG, CTG, GTG, GAT, GAA, ATG, AGT, TGC, CAT, CTG, GTG, CTC, ACC, ACG, GGC, GGA, ACT, GGC, CCT, GCG, CGT, CGT, GAC, GTA, ACG, CCC, GAT, GCG, ACG, CTG, GCA, GTA, GCG, GAC, CGC, GAG, ATG, CCA, GGC, TTT, GGT, GAA, CAG, ATG, CGC, CAG, ATC, AGC, CTG, CAT, TTT, GTA, CCA, ACT, GCG, ATC, CTT, TCG, CGT, CAG, GTG, GGG, GTG, ATT, CGC, AAA, CAG, GCG, CTG, ATC, CTT, AAC, TTA, CCC, GGT, CAA, CCG, AAG, TCT, ATT, AAA, GAG, ACG, CTG, GAA, GGT, GTG, AAG, GAC, GCT, GAG, GGT, AAC, GTT, GTG, GTG, CAC, GGT, ATT, TTT, GCC, AGC, GTA, CCG, TAC, TGC, ATT, CAG, TTG, CTG, GAA, GGG, CCA, TAC, GTT, GAA, ACG, GCA, CCG, GAA, GTG, GTT, GCA, GCA, TTC, AGA, CCG, AAG, AGT, GCA, AGA, CGC, GAA, GTT, AGC, GAA, TAA] +Is Protein?: YES + +Region Name: chaperone protein DnaK +Nucleotides: 
ATGGGTAAAATAATTGGTATCGACCTGGGTACTACCAACTCTTGTGTAGCGATTATGGATGGCACCACTCCTCGTGTACTGGAGAACGCCGAAGGCGATCGCACCACGCCTTCTATCATTGCCTATACCCAGGATGGTGAAACTCTGGTTGGTCAGCCGGCTAAACGTCAGGCAGTGACGAACCCGCAAAACACCCTGTTTGCGATTAAACGCCTGATTGGCCGCCGCTTCCAGGACGAAGAAGTACAGCGTGATGTTTCCATCATGCCGTTCAAAATTATTGCTGCTGATAACGGCGACGCATGGGTCGAAGTTAAAGGCCAGAAAATGGCACCGCCGCAGATCTCTGCTGAAGTGCTGAAAAAAATGAAGAAAACCGCTGAAGATTACCTGGGTGAACCGGTAACTGAAGCTGTTATTACCGTACCGGCATACTTTAACGATGCTCAGCGTCAGGCAACCAAAGACGCAGGCCGTATCGCTGGTCTGGAAGTAAAACGTATCATCAACGAACCGACCGCAGCTGCGCTGGCTTACGGTCTGGACAAAGGTACTGGCAACCGTACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTCCATTATCGAAATCGACGAAGTTGACGGCGAAAAAACCTTCGAAGTTCTGGCAACCAACGGTGATACCCACCTGGGTGGTGAAGACTTCGACAGTCGTCTGATCAACTATCTGGTTGAAGAATTCAAGAAAGATCAGGGCATTGACCTGCGCAACGATCCGCTGGCAATGCAGCGCCTGAAAGAAGCGGCAGAAAAAGCGAAAATCGAACTGTCTTCCGCTCAGCAGACCGACGTTAACCTGCCGTACATCACTGCAGACGCGACCGGTCCGAAACACATGAACATCAAAGTGACTCGTGCGAAACTGGAAAGCCTGGTTGAAGATCTGGTAAACCGTTCCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATATCGACGACGTTATTCTCGTTGGTGGTCAGACTCGTATGCCAATGGTTCAGAAGAAAGTTGCTGAATTCTTTGGTAAAGAGCCGCGTAAAGATGTTAACCCGGACGAAGCTGTAGCCATCGGTGCTGCTGTTCAGGGTGGTGTTCTGACTGGTGACGTAAAAGACGTACTGCTGCTGGACGTTACCCCGCTGTCTCTGGGTATCGAAACCATGGGCGGTGTGATGACCACGCTGATCGCGAAAAACACCACTATCCCGACCAAGCACAGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATCCATGTGCTGCAGGGTGAACGTAAACGTGCGGCTGATAACAAATCTCTGGGTCAGTTCAACCTGGATGGTATCAACCCGGCACCGCGCGGCATGCCGCAGATCGAAGTTACCTTCGATATCGATGCTGACGGTATCCTGCACGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCACTATCAAGGCTTCTTCTGGTCTGAACGAAGATGAAATCCAGAAAATGGTACGCGACGCAGAAGCTAACGCCGAAGCTGACCGTAAGTTTGAAGAGCTGGTACAGACTCGCAACCAGGGCGACCATCTGCTGCACAGCACCCGTAAGCAGGTTGAAGAAGCAGGCGACAAACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGACTGCACTGGAAACTGCTCTGAAAGGTGAAGACAAAGCCGCTATCGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCAGCAGCAACATGCCCAGCAGCAGACTGCCGGTGCTGATGCTTCTGCAAACAACGCGAAAGATGACGATGTTGTCGACGCTGAATTTGAAGAAGTCAAAGACAAAAAATAA +Nuc. 
Counts: [541, 475, 504, 397] +Total Mass%: [29.0, 21.0, 30.3, 19.7] of 251714.2 +Codons List: [ATG, GGT, AAA, ATA, ATT, GGT, ATC, GAC, CTG, GGT, ACT, ACC, AAC, TCT, TGT, GTA, GCG, ATT, ATG, GAT, GGC, ACC, ACT, CCT, CGT, GTA, CTG, GAG, AAC, GCC, GAA, GGC, GAT, CGC, ACC, ACG, CCT, TCT, ATC, ATT, GCC, TAT, ACC, CAG, GAT, GGT, GAA, ACT, CTG, GTT, GGT, CAG, CCG, GCT, AAA, CGT, CAG, GCA, GTG, ACG, AAC, CCG, CAA, AAC, ACC, CTG, TTT, GCG, ATT, AAA, CGC, CTG, ATT, GGC, CGC, CGC, TTC, CAG, GAC, GAA, GAA, GTA, CAG, CGT, GAT, GTT, TCC, ATC, ATG, CCG, TTC, AAA, ATT, ATT, GCT, GCT, GAT, AAC, GGC, GAC, GCA, TGG, GTC, GAA, GTT, AAA, GGC, CAG, AAA, ATG, GCA, CCG, CCG, CAG, ATC, TCT, GCT, GAA, GTG, CTG, AAA, AAA, ATG, AAG, AAA, ACC, GCT, GAA, GAT, TAC, CTG, GGT, GAA, CCG, GTA, ACT, GAA, GCT, GTT, ATT, ACC, GTA, CCG, GCA, TAC, TTT, AAC, GAT, GCT, CAG, CGT, CAG, GCA, ACC, AAA, GAC, GCA, GGC, CGT, ATC, GCT, GGT, CTG, GAA, GTA, AAA, CGT, ATC, ATC, AAC, GAA, CCG, ACC, GCA, GCT, GCG, CTG, GCT, TAC, GGT, CTG, GAC, AAA, GGT, ACT, GGC, AAC, CGT, ACT, ATC, GCG, GTT, TAT, GAC, CTG, GGT, GGT, GGT, ACT, TTC, GAT, ATT, TCC, ATT, ATC, GAA, ATC, GAC, GAA, GTT, GAC, GGC, GAA, AAA, ACC, TTC, GAA, GTT, CTG, GCA, ACC, AAC, GGT, GAT, ACC, CAC, CTG, GGT, GGT, GAA, GAC, TTC, GAC, AGT, CGT, CTG, ATC, AAC, TAT, CTG, GTT, GAA, GAA, TTC, AAG, AAA, GAT, CAG, GGC, ATT, GAC, CTG, CGC, AAC, GAT, CCG, CTG, GCA, ATG, CAG, CGC, CTG, AAA, GAA, GCG, GCA, GAA, AAA, GCG, AAA, ATC, GAA, CTG, TCT, TCC, GCT, CAG, CAG, ACC, GAC, GTT, AAC, CTG, CCG, TAC, ATC, ACT, GCA, GAC, GCG, ACC, GGT, CCG, AAA, CAC, ATG, AAC, ATC, AAA, GTG, ACT, CGT, GCG, AAA, CTG, GAA, AGC, CTG, GTT, GAA, GAT, CTG, GTA, AAC, CGT, TCC, ATT, GAG, CCG, CTG, AAA, GTT, GCA, CTG, CAG, GAC, GCT, GGC, CTG, TCC, GTA, TCT, GAT, ATC, GAC, GAC, GTT, ATT, CTC, GTT, GGT, GGT, CAG, ACT, CGT, ATG, CCA, ATG, GTT, CAG, AAG, AAA, GTT, GCT, GAA, TTC, TTT, GGT, AAA, GAG, CCG, CGT, AAA, GAT, GTT, AAC, CCG, GAC, GAA, GCT, GTA, GCC, ATC, GGT, GCT, GCT, GTT, CAG, GGT, GGT, GTT, 
CTG, ACT, GGT, GAC, GTA, AAA, GAC, GTA, CTG, CTG, CTG, GAC, GTT, ACC, CCG, CTG, TCT, CTG, GGT, ATC, GAA, ACC, ATG, GGC, GGT, GTG, ATG, ACC, ACG, CTG, ATC, GCG, AAA, AAC, ACC, ACT, ATC, CCG, ACC, AAG, CAC, AGC, CAG, GTG, TTC, TCT, ACC, GCT, GAA, GAC, AAC, CAG, TCT, GCG, GTA, ACC, ATC, CAT, GTG, CTG, CAG, GGT, GAA, CGT, AAA, CGT, GCG, GCT, GAT, AAC, AAA, TCT, CTG, GGT, CAG, TTC, AAC, CTG, GAT, GGT, ATC, AAC, CCG, GCA, CCG, CGC, GGC, ATG, CCG, CAG, ATC, GAA, GTT, ACC, TTC, GAT, ATC, GAT, GCT, GAC, GGT, ATC, CTG, CAC, GTT, TCC, GCG, AAA, GAC, AAA, AAC, AGC, GGT, AAA, GAG, CAG, AAG, ATC, ACT, ATC, AAG, GCT, TCT, TCT, GGT, CTG, AAC, GAA, GAT, GAA, ATC, CAG, AAA, ATG, GTA, CGC, GAC, GCA, GAA, GCT, AAC, GCC, GAA, GCT, GAC, CGT, AAG, TTT, GAA, GAG, CTG, GTA, CAG, ACT, CGC, AAC, CAG, GGC, GAC, CAT, CTG, CTG, CAC, AGC, ACC, CGT, AAG, CAG, GTT, GAA, GAA, GCA, GGC, GAC, AAA, CTG, CCG, GCT, GAC, GAC, AAA, ACT, GCT, ATC, GAG, TCT, GCG, CTG, ACT, GCA, CTG, GAA, ACT, GCT, CTG, AAA, GGT, GAA, GAC, AAA, GCC, GCT, ATC, GAA, GCG, AAA, ATG, CAG, GAA, CTG, GCA, CAG, GTT, TCC, CAG, AAA, CTG, ATG, GAA, ATC, GCC, CAG, CAG, CAA, CAT, GCC, CAG, CAG, CAG, ACT, GCC, GGT, GCT, GAT, GCT, TCT, GCA, AAC, AAC, GCG, AAA, GAT, GAC, GAT, GTT, GTC, GAC, GCT, GAA, TTT, GAA, GAA, GTC, AAA, GAC, AAA, AAA, TAA] +Is Protein?: YES + +Region Name: chaperone protein DnaJ +Nucleotides: 
GTGCATTCATCTAGGGGCAATTTAAAAAAGATGGCTAAGCAAGATTATTACGAGATTTTAGGCGTTTCCAAAACAGCGGAAGAGCGTGAAATCAAAAAGGCCTACAAACGCCTGGCCATGAAATACCACCCGGACCGTAACCAGGGTGACAAAGAGGCCGAGGCGAAATTTAAAGAGATCAAGGAAGCTTATGAAGTTCTGACCGACTCGCAAAAACGTGCGGCATACGATCAGTATGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGCGGTTTTGGCGGCGGCGCAGACTTCAGCGATATTTTTGGTGACGTTTTCGGCGATATTTTTGGCGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTACGCTATAACATGGAGCTCACCCTCGAAGAAGCTGTACGTGGCGTGACCAAAGAGATCCGCATTCCGACTCTGGAAGAGTGTGACGTTTGCCACGGTAGCGGTGCAAAACCAGGTACACAGCCGCAGACCTGTCCGACCTGTCATGGTTCTGGCCAGGTGCAGATGCGCCAGGGTTTCTTTGCCGTGCAGCAGACCTGTCCACACTGTCAGGGCCGCGGTACGCTGATCAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGTTGAGCGCAGCAAAACGCTGTCCGTTAAAATCCCGGCAGGGGTGGACACTGGAGACCGCATCCGTCTTGCGGGCGAAGGTGAAGCGGGTGAACACGGCGCACCGGCAGGCGATCTGTACGTTCAGGTTCAGGTTAAACAGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGCGAAGTCCCGATCAACTTCGCTATGGCGGCGCTGGGTGGTGAAATCGAAGTACCGACCCTTGATGGTCGCGTCAAACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAGCTGTTCCGTATGCGCGGTAAAGGCGTCAAGTCTGTCCGCGGTGGCGCACAGGGTGATTTGCTATGCCGCGTTGTTGTCGAAACACCGGTAGGTTTGAACGAGAAGCAGAAACAGCTGCTGCAAGAGCTGCAAGAAAGCTTTGGTGGCCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCTTCTTTGATGGCGTGAAGAAGTTTTTTGACGACCTGACTCGCTAA +Nuc. 
Counts: [287, 278, 352, 244] +Total Mass%: [25.3, 20.1, 34.7, 19.9] of 153391.5 +Codons List: [GTG, CAT, TCA, TCT, AGG, GGC, AAT, TTA, AAA, AAG, ATG, GCT, AAG, CAA, GAT, TAT, TAC, GAG, ATT, TTA, GGC, GTT, TCC, AAA, ACA, GCG, GAA, GAG, CGT, GAA, ATC, AAA, AAG, GCC, TAC, AAA, CGC, CTG, GCC, ATG, AAA, TAC, CAC, CCG, GAC, CGT, AAC, CAG, GGT, GAC, AAA, GAG, GCC, GAG, GCG, AAA, TTT, AAA, GAG, ATC, AAG, GAA, GCT, TAT, GAA, GTT, CTG, ACC, GAC, TCG, CAA, AAA, CGT, GCG, GCA, TAC, GAT, CAG, TAT, GGT, CAT, GCT, GCG, TTT, GAG, CAA, GGT, GGC, ATG, GGC, GGC, GGC, GGT, TTT, GGC, GGC, GGC, GCA, GAC, TTC, AGC, GAT, ATT, TTT, GGT, GAC, GTT, TTC, GGC, GAT, ATT, TTT, GGC, GGC, GGA, CGT, GGT, CGT, CAA, CGT, GCG, GCG, CGC, GGT, GCT, GAT, TTA, CGC, TAT, AAC, ATG, GAG, CTC, ACC, CTC, GAA, GAA, GCT, GTA, CGT, GGC, GTG, ACC, AAA, GAG, ATC, CGC, ATT, CCG, ACT, CTG, GAA, GAG, TGT, GAC, GTT, TGC, CAC, GGT, AGC, GGT, GCA, AAA, CCA, GGT, ACA, CAG, CCG, CAG, ACC, TGT, CCG, ACC, TGT, CAT, GGT, TCT, GGC, CAG, GTG, CAG, ATG, CGC, CAG, GGT, TTC, TTT, GCC, GTG, CAG, CAG, ACC, TGT, CCA, CAC, TGT, CAG, GGC, CGC, GGT, ACG, CTG, ATC, AAA, GAT, CCG, TGC, AAC, AAA, TGT, CAT, GGT, CAT, GGT, CGT, GTT, GAG, CGC, AGC, AAA, ACG, CTG, TCC, GTT, AAA, ATC, CCG, GCA, GGG, GTG, GAC, ACT, GGA, GAC, CGC, ATC, CGT, CTT, GCG, GGC, GAA, GGT, GAA, GCG, GGT, GAA, CAC, GGC, GCA, CCG, GCA, GGC, GAT, CTG, TAC, GTT, CAG, GTT, CAG, GTT, AAA, CAG, CAC, CCG, ATT, TTC, GAG, CGT, GAA, GGC, AAC, AAC, CTG, TAT, TGC, GAA, GTC, CCG, ATC, AAC, TTC, GCT, ATG, GCG, GCG, CTG, GGT, GGT, GAA, ATC, GAA, GTA, CCG, ACC, CTT, GAT, GGT, CGC, GTC, AAA, CTG, AAA, GTG, CCT, GGC, GAA, ACC, CAG, ACC, GGT, AAG, CTG, TTC, CGT, ATG, CGC, GGT, AAA, GGC, GTC, AAG, TCT, GTC, CGC, GGT, GGC, GCA, CAG, GGT, GAT, TTG, CTA, TGC, CGC, GTT, GTT, GTC, GAA, ACA, CCG, GTA, GGT, TTG, AAC, GAG, AAG, CAG, AAA, CAG, CTG, CTG, CAA, GAG, CTG, CAA, GAA, AGC, TTT, GGT, GGC, CCA, ACC, GGC, GAG, CAC, AAC, AGC, CCG, CGT, TCA, AAG, AGC, TTC, TTT, GAT, GGC, GTG, AAG, AAG, TTT, TTT, 
GAC, GAC, CTG, ACT, CGC, TAA] +Is Protein?: NO + +Region Name: hypothetical protein +Nucleotides: TTGCTCTTACTCGGATTCGTAAGCCGTGAAAACAGCAACCTCCGTCTGGCCAGTTCGGATGTGAACCTCACAGAGGTCTTTTCTCGTTACCAGCGCCGCCACTACGGCGGTGATACAGATGACGATCAGGGCGACAATCATCGCCTTATGCTGCTTCATTGCTCTCTTCTCCTTGACCTTTCGGTCAGTAAGAGGCACTCTACATGTGTTCTGCATATAGGGGGCCTCGGGTTGATGGTAAAATATCACTCGGGGCTTTTCTCTATCTGCCGTTCAGCTAATGCCTGA +Nuc. Counts: [58, 78, 69, 83] +Total Mass%: [21.0, 23.2, 27.9, 27.8] of 37315.2 +Codons List: [TTG, CTC, TTA, CTC, GGA, TTC, GTA, AGC, CGT, GAA, AAC, AGC, AAC, CTC, CGT, CTG, GCC, AGT, TCG, GAT, GTG, AAC, CTC, ACA, GAG, GTC, TTT, TCT, CGT, TAC, CAG, CGC, CGC, CAC, TAC, GGC, GGT, GAT, ACA, GAT, GAC, GAT, CAG, GGC, GAC, AAT, CAT, CGC, CTT, ATG, CTG, CTT, CAT, TGC, TCT, CTT, CTC, CTT, GAC, CTT, TCG, GTC, AGT, AAG, AGG, CAC, TCT, ACA, TGT, GTT, CTG, CAT, ATA, GGG, GGC, CTC, GGG, TTG, ATG, GTA, AAA, TAT, CAC, TCG, GGG, CTT, TTC, TCT, ATC, TGC, CGT, TCA, GCT, AAT, GCC, TGA] +Is Protein?: NO + +Region Name: hypothetical protein +Nucleotides: ATGTCTGCCAAAAGACGACTTCTTATTGCGTGTACCTTGATAACAGCTATCTATCATTTTCCTGCATATTCTTCATTAGAATATAAAGGATCCTTTGGTTCAATAAATGCGGGTTATGCAGACTGGAATAGTGGATTTGTAAACACTCACCGTGGTGAAGTATGGAAAGTGACTGCGGATTTTGGGGTAAATTTTAAAGAAGCAGAATTTTACTCATTTTATGAAAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACGGTTTCAGCAATGACGCATGTCAGACTCTTTGACTCTGATATGACATTCTTTGGCAAAATTTATGGCCAATGGGATAACTCATGGGGTGACGATCTGGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCGAGTGGGGCTTTTTTAAACCGTATATTGGATTGCATAATCAATCTGGTGACTACGTATCAGCTAAATATGGTCAAACGAATGGTTGGAATGGTTATGTTGTTGGCTGGACAGCAGTATTACCATTTACGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGAAATAGAACTGGACAGGAACGATGCTTACACGGAGCAGCAATTTGGCCGGAACGGGTTAAATGGCGGTTTAACTATTGCCTGGAAGTTCTATCCTCGCTGGAAAGCCAGTGTGACGTGGCGTTATTTCGATAATAAGCTGGGCTACGATGGCTTTGGCGATCAAATGATTTATATGCTTGGTTATGATTTCTAA +Nuc. 
Counts: [214, 121, 184, 243] +Total Mass%: [28.8, 13.4, 27.7, 30.2] of 100569.4 +Codons List: [ATG, TCT, GCC, AAA, AGA, CGA, CTT, CTT, ATT, GCG, TGT, ACC, TTG, ATA, ACA, GCT, ATC, TAT, CAT, TTT, CCT, GCA, TAT, TCT, TCA, TTA, GAA, TAT, AAA, GGA, TCC, TTT, GGT, TCA, ATA, AAT, GCG, GGT, TAT, GCA, GAC, TGG, AAT, AGT, GGA, TTT, GTA, AAC, ACT, CAC, CGT, GGT, GAA, GTA, TGG, AAA, GTG, ACT, GCG, GAT, TTT, GGG, GTA, AAT, TTT, AAA, GAA, GCA, GAA, TTT, TAC, TCA, TTT, TAT, GAA, AGT, AAT, GTA, CTC, AAT, CAT, GCT, GTA, GCA, GGG, AGA, AAT, CAT, ACG, GTT, TCA, GCA, ATG, ACG, CAT, GTC, AGA, CTC, TTT, GAC, TCT, GAT, ATG, ACA, TTC, TTT, GGC, AAA, ATT, TAT, GGC, CAA, TGG, GAT, AAC, TCA, TGG, GGT, GAC, GAT, CTG, GAC, ATG, TTT, TAT, GGA, TTC, GGT, TAC, CTC, GGC, TGG, AAC, GGC, GAG, TGG, GGC, TTT, TTT, AAA, CCG, TAT, ATT, GGA, TTG, CAT, AAT, CAA, TCT, GGT, GAC, TAC, GTA, TCA, GCT, AAA, TAT, GGT, CAA, ACG, AAT, GGT, TGG, AAT, GGT, TAT, GTT, GTT, GGC, TGG, ACA, GCA, GTA, TTA, CCA, TTT, ACG, TTA, TTT, GAC, GAA, AAA, TTT, GTT, TTA, TCT, AAC, TGG, AAT, GAA, ATA, GAA, CTG, GAC, AGG, AAC, GAT, GCT, TAC, ACG, GAG, CAG, CAA, TTT, GGC, CGG, AAC, GGG, TTA, AAT, GGC, GGT, TTA, ACT, ATT, GCC, TGG, AAG, TTC, TAT, CCT, CGC, TGG, AAA, GCC, AGT, GTG, ACG, TGG, CGT, TAT, TTC, GAT, AAT, AAG, CTG, GGC, TAC, GAT, GGC, TTT, GGC, GAT, CAA, ATG, ATT, TAT, ATG, CTT, GGT, TAT, GAT, TTC, TAA] +Is Protein?: YES + +Region Name: putative secreted sulfatase +Nucleotides: 
ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAATGCTTTTAGTCCTGCCTTAGCCGCAGAGGCTAAACAACCTAATTTAGTCATTATTATGGCGGATGATTTAGGTTATGGCGATTTAGCAACATATGGTCATCAGATCGTTAAAACACCTAATATCGACAGGCTTGCCCAGGAAGGGGTCAAATTTACTGACTACTATGCCCCCGCTCCTTTAAGTTCACCTTCACGCGCAGGGCTATTAACCGGCCGGATGCCATTTCGTACTGGAATTCGCTCATGGATTCCTTCAGGCAAAGATGTTGCCTTAGGGCGTAACGAACTCACGATTGCTAATCTACTCAAAGCGCAAGGGTACGACACGGCAATGATGGGTAAGCTGCATCTGAATGCAGGCGGCGATCGCACCGATCAGCCACAAGCACAAGATATGGGCTTTGATTACTCACTGGTTAATACGGCGGGCTTTGTTACCGACGCCACGCTGGATAACGCTAAAGAACGCCCGCGTTATGGCATGGTTTACCCGACAGGCTGGCTACGTAACGGGCAACCCACTCCACGAGCTGATAAAATGAGCGGTGAGTATGTCAGTTCGGAAGTCGTCAACTGGCTGGATAACAAAAAGGACAGCAAGCCTTTCTTCCTCTATGTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAAAATACCTCGATATGTACTCACAATATATGAGCGCGTATCAGAAGCAGCATCCTGATTTATTTTATGGCGACTGGGCAGACAAACCCTGGCGTGGTGTGGGGGAATATTATGCCAATATCAGCTATCTGGATGCACAGGTTGGAAAAGTGCTGGATAAAATCAAAGCTGTGGGTGAAGAAGATAACACAATCGTTATTTTTACCAGTGATAACGGTCCGGTAACGCGTGAAGCGCGCAAAGTGTATGAGCTGAATTTGGCAGGGGAAACGGATGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGTGTTCCAGCCATTATTAAATATGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGTCTGGACTGGATGCCTACTTTAGCGAAAATGATGAACTTCAAATTACCTACAGACCGTACTTTCGATGGTGAATCGCTGGTTCCTGTTCTTGAGCAAAAAGCATTGAAACGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATGATCCAACCGATGAATGGGCGATCCGTGATGGTGACTGGAAGATGATTATCGATCGCAATAATAAACCGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAACACTTAATCTGATCGGTAAAAAAACAGATATTGAAAAACAGATGTATGGTAAGTTTTTAAAATATAAAACTGATATTGATAATGATTCTCTAATGAAAGCCAGAGGTGATAAACCAGAAGCGGTGACCTGGGGCTAA +Nuc. 
Counts: [440, 312, 362, 380] +Total Mass%: [30.3, 17.7, 27.9, 24.2] of 196369.5 +Codons List: [ATG, CAG, AAA, ACG, TTA, ATG, GCC, AGT, TTG, ATC, GGC, CTT, GCA, GTT, TGC, ACA, GGG, AAT, GCT, TTT, AGT, CCT, GCC, TTA, GCC, GCA, GAG, GCT, AAA, CAA, CCT, AAT, TTA, GTC, ATT, ATT, ATG, GCG, GAT, GAT, TTA, GGT, TAT, GGC, GAT, TTA, GCA, ACA, TAT, GGT, CAT, CAG, ATC, GTT, AAA, ACA, CCT, AAT, ATC, GAC, AGG, CTT, GCC, CAG, GAA, GGG, GTC, AAA, TTT, ACT, GAC, TAC, TAT, GCC, CCC, GCT, CCT, TTA, AGT, TCA, CCT, TCA, CGC, GCA, GGG, CTA, TTA, ACC, GGC, CGG, ATG, CCA, TTT, CGT, ACT, GGA, ATT, CGC, TCA, TGG, ATT, CCT, TCA, GGC, AAA, GAT, GTT, GCC, TTA, GGG, CGT, AAC, GAA, CTC, ACG, ATT, GCT, AAT, CTA, CTC, AAA, GCG, CAA, GGG, TAC, GAC, ACG, GCA, ATG, ATG, GGT, AAG, CTG, CAT, CTG, AAT, GCA, GGC, GGC, GAT, CGC, ACC, GAT, CAG, CCA, CAA, GCA, CAA, GAT, ATG, GGC, TTT, GAT, TAC, TCA, CTG, GTT, AAT, ACG, GCG, GGC, TTT, GTT, ACC, GAC, GCC, ACG, CTG, GAT, AAC, GCT, AAA, GAA, CGC, CCG, CGT, TAT, GGC, ATG, GTT, TAC, CCG, ACA, GGC, TGG, CTA, CGT, AAC, GGG, CAA, CCC, ACT, CCA, CGA, GCT, GAT, AAA, ATG, AGC, GGT, GAG, TAT, GTC, AGT, TCG, GAA, GTC, GTC, AAC, TGG, CTG, GAT, AAC, AAA, AAG, GAC, AGC, AAG, CCT, TTC, TTC, CTC, TAT, GTT, GCT, TTT, ACC, GAA, GTG, CAT, AGC, CCC, CTG, GCT, TCG, CCC, AAA, AAA, TAC, CTC, GAT, ATG, TAC, TCA, CAA, TAT, ATG, AGC, GCG, TAT, CAG, AAG, CAG, CAT, CCT, GAT, TTA, TTT, TAT, GGC, GAC, TGG, GCA, GAC, AAA, CCC, TGG, CGT, GGT, GTG, GGG, GAA, TAT, TAT, GCC, AAT, ATC, AGC, TAT, CTG, GAT, GCA, CAG, GTT, GGA, AAA, GTG, CTG, GAT, AAA, ATC, AAA, GCT, GTG, GGT, GAA, GAA, GAT, AAC, ACA, ATC, GTT, ATT, TTT, ACC, AGT, GAT, AAC, GGT, CCG, GTA, ACG, CGT, GAA, GCG, CGC, AAA, GTG, TAT, GAG, CTG, AAT, TTG, GCA, GGG, GAA, ACG, GAT, GGA, TTA, CGC, GGT, CGC, AAG, GAT, AAC, CTT, TGG, GAA, GGC, GGA, ATT, CGT, GTT, CCA, GCC, ATT, ATT, AAA, TAT, GGT, AAA, CAT, CTA, CCA, CAG, GGA, ATG, GTT, TCA, GAT, ACA, CCC, GTT, TAT, GGT, CTG, GAC, TGG, ATG, CCT, ACT, TTA, GCG, AAA, ATG, ATG, AAC, TTC, AAA, TTA, 
CCT, ACA, GAC, CGT, ACT, TTC, GAT, GGT, GAA, TCG, CTG, GTT, CCT, GTT, CTT, GAG, CAA, AAA, GCA, TTG, AAA, CGC, GAA, AAG, CCA, TTA, ATT, TTC, GGG, ATT, GAT, ATG, CCA, TTC, CAG, GAT, GAT, CCA, ACC, GAT, GAA, TGG, GCG, ATC, CGT, GAT, GGT, GAC, TGG, AAG, ATG, ATT, ATC, GAT, CGC, AAT, AAT, AAA, CCG, AAA, TAT, CTC, TAC, AAT, CTG, AAA, TCT, GAT, CGT, TAT, GAA, ACA, CTT, AAT, CTG, ATC, GGT, AAA, AAA, ACA, GAT, ATT, GAA, AAA, CAG, ATG, TAT, GGT, AAG, TTT, TTA, AAA, TAT, AAA, ACT, GAT, ATT, GAT, AAT, GAT, TCT, CTA, ATG, AAA, GCC, AGA, GGT, GAT, AAA, CCA, GAA, GCG, GTG, ACC, TGG, GGC, TAA] +Is Protein?: YES + +Region Name: putative cytoplasmic protein +Nucleotides: ATGTTTACCAACGTAAATGTTGATTGTTGCAAAACACCAGGATGTAAAAACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCACAGGGTAAAAATATTTTATGCCGTGAATGTGGTTACTTGTTTCCAGTGATATCTGAACAGTCGCTTAATATTTATCGTAATATTGTGAATCACTCCTGGAGAGGTTTGATTTGCCAATGTTCAACTTGCGGAGGCACGTCCCTCAAAAAATATGGATATTCTGCACAAGGCCAGAGAAGAATGTATTGCCATCATTGTGAGAAAACATTTATCACTCTGGAACATGTAATTACCACACCACGAGGAGCCCTGTTAGCATTGATGATTGAGCAAGGGGAGGCACTTGCGGATATCAGAAAGTCATTACGTCTTAACAGCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGCAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGTACCCGCGCTTTTCGCGTCAAGTATAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGCGGCAGGGTGGTTGCCATCTCAACCAATTACTCCCCATCTGCCGTAGAGCAACATTATCAATACACATCGAACTATGAAGAGCGTATGTCTCCAGGGACGCTGGCACATCATGTCCAGCGCAAAGAGTTACTTACTATGCGGCGGGATACCTTGTTTGATATTGATTACGGCCCGGCAGTTTTACATCAAAACGATCCGGGAATGTTGGTAAAACCGGTTCTTCCGGCATATCGTCATTTTGAACTGGTCAGAATACTGACCGATGAGCATTCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATATTGGGCGGCTGCCTGATGGCTAATTTGCAGCATATTCATCAAGGTCGCTGCCATATTTCCTTTGTCAAAGAGCGCGGTGTGGCACCCGCCACCATTGATTTTCCACCGCGATTATTCCTTAGTGGTGGGGTACGAAATAATGTCTGGCGTGCATTTTCTAACCGCAATTATTCAATGGCTGTATGCAATCTCACTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATTGAACAGTGCGACGCGTTTTATCCACTTTGTGGAGAACCATCCTTTCCTTATATCATTGAACCGAATGTCTCCTGCGAATGTCGTTTCTACATTAGATATCCTCAAACATCTGTGGAATAAAAAACTAGAGCATGGAACAATTTAA +Nuc. 
Counts: [355, 273, 276, 356] +Total Mass%: [29.2, 18.4, 25.3, 27.1] of 164551.0 +Codons List: [ATG, TTT, ACC, AAC, GTA, AAT, GTT, GAT, TGT, TGC, AAA, ACA, CCA, GGA, TGT, AAA, AAC, CTG, GGG, TTG, CTG, AAT, AGC, CAG, GAT, TAT, GTC, GCA, CAG, GGT, AAA, AAT, ATT, TTA, TGC, CGT, GAA, TGT, GGT, TAC, TTG, TTT, CCA, GTG, ATA, TCT, GAA, CAG, TCG, CTT, AAT, ATT, TAT, CGT, AAT, ATT, GTG, AAT, CAC, TCC, TGG, AGA, GGT, TTG, ATT, TGC, CAA, TGT, TCA, ACT, TGC, GGA, GGC, ACG, TCC, CTC, AAA, AAA, TAT, GGA, TAT, TCT, GCA, CAA, GGC, CAG, AGA, AGA, ATG, TAT, TGC, CAT, CAT, TGT, GAG, AAA, ACA, TTT, ATC, ACT, CTG, GAA, CAT, GTA, ATT, ACC, ACA, CCA, CGA, GGA, GCC, CTG, TTA, GCA, TTG, ATG, ATT, GAG, CAA, GGG, GAG, GCA, CTT, GCG, GAT, ATC, AGA, AAG, TCA, TTA, CGT, CTT, AAC, AGC, ACT, GGA, CTT, AGC, CGT, GAA, CTG, TTA, AAA, TTA, GCG, CGT, GAA, GCA, AAC, TAT, AAA, GAA, AGT, CGA, CAG, TGT, TTC, CCT, GCT, TCT, GAT, ATT, ACC, CTG, AGT, ACC, CGC, GCT, TTT, CGC, GTC, AAG, TAT, AAT, GGT, AGC, AAT, AAC, TCT, CTT, TAT, GCT, CTT, GTT, ACC, GCA, GAA, GAA, CAA, AGC, GGC, AGG, GTG, GTT, GCC, ATC, TCA, ACC, AAT, TAC, TCC, CCA, TCT, GCC, GTA, GAG, CAA, CAT, TAT, CAA, TAC, ACA, TCG, AAC, TAT, GAA, GAG, CGT, ATG, TCT, CCA, GGG, ACG, CTG, GCA, CAT, CAT, GTC, CAG, CGC, AAA, GAG, TTA, CTT, ACT, ATG, CGG, CGG, GAT, ACC, TTG, TTT, GAT, ATT, GAT, TAC, GGC, CCG, GCA, GTT, TTA, CAT, CAA, AAC, GAT, CCG, GGA, ATG, TTG, GTA, AAA, CCG, GTT, CTT, CCG, GCA, TAT, CGT, CAT, TTT, GAA, CTG, GTC, AGA, ATA, CTG, ACC, GAT, GAG, CAT, TCC, AAC, AAC, GTT, CAG, CAT, TAC, CTT, GAT, CAC, GAA, TGC, TTT, ATA, TTG, GGC, GGC, TGC, CTG, ATG, GCT, AAT, TTG, CAG, CAT, ATT, CAT, CAA, GGT, CGC, TGC, CAT, ATT, TCC, TTT, GTC, AAA, GAG, CGC, GGT, GTG, GCA, CCC, GCC, ACC, ATT, GAT, TTT, CCA, CCG, CGA, TTA, TTC, CTT, AGT, GGT, GGG, GTA, CGA, AAT, AAT, GTC, TGG, CGT, GCA, TTT, TCT, AAC, CGC, AAT, TAT, TCA, ATG, GCT, GTA, TGC, AAT, CTC, ACT, GGC, AGT, AAG, AAA, GTC, CGC, GAG, ATG, CGG, CAT, GCA, ACA, TTG, AAC, AGT, GCG, ACG, CGT, TTT, ATC, CAC, TTT, 
GTG, GAG, AAC, CAT, CCT, TTC, CTT, ATA, TCA, TTG, AAC, CGA, ATG, TCT, CCT, GCG, AAT, GTC, GTT, TCT, ACA, TTA, GAT, ATC, CTC, AAA, CAT, CTG, TGG, AAT, AAA, AAA, CTA, GAG, CAT, GGA, ACA, ATT, TAA] +Is Protein?: YES + +Region Name: sodium/proton antiporter 1 +Nucleotides: GTGAAACATCTGCATCGATTCTTTAGCAGTGATGCCTCGGGAGGCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTGCAACCAGTGGATGGTATCACGACTTTCTTGAGACGCCGGTTCAGCTCCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGACGCTCTGATGGCGGTATTTTTCCTGTTGGTTGGTCTGGAAGTTAAACGCGAGCTGATGCAAGGTTCGCTGGCCAGTCTGCGCCAGGCGGCATTTCCTGTTATTGCCGCAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTTTTAACTATGCCGATCCGATTACCCGCGAAGGCTGGGCAATCCCGGCGGCGACTGACATTGCCTTTGCACTTGGTGTGTTGGCGCTGTTGGGAAGTCGTGTTCCGTTAGCGCTGAAGATCTTTTTGATGGCTCTGGCTATTATCGACGATCTTGGGGCCATCATTATCATCGCATTGTTCTACACTAATGACTTATCGATGGCCTCTCTTGGCGTCGCGGCTGTAGCAATTGCGGTACTCGCGGTATTGAATCTGTGTGGTGTACGCCGCACGGGCGTTTATATTCTGGTTGGCGTGGTGCTGTGGACAGCGGTGTTGAAATCGGGGGTTCACGCAACCCTGGCTGGCGTCATTGTCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGGCGCTCTCCGGCTAAACGTCTGGAGCATGTTTTGCATCCATGGGTGGCGTATCTGATTTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAAGGTGTCACGCTGGAAGGTTTGACCTCCATTCTGCCATTAGGGATCATCGCTGGTTTGCTGATTGGCAAGCCACTGGGTATTAGTCTGTTCTGCTGGTTGGCGCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACGACTTACCAGCAAATTATGGCGGTTGGTATCCTGTGCGGTATCGGTTTTACTATGTCTATCTTTATTGCCAGCCTGGCATTTGGTAGCGTAGATCCAGAACTGATTAACTGGGCAAAATTAGGTATCCTTGTCGGTTCAATTTCTTCGGCGGTAATTGGATATAGCTGGTTACGCGTTCGTTTACGTCCATCAGTTTGA +Nuc. 
Counts: [215, 258, 331, 363] +Total Mass%: [19.0, 18.7, 32.7, 29.7] of 153154.3 +Codons List: [GTG, AAA, CAT, CTG, CAT, CGA, TTC, TTT, AGC, AGT, GAT, GCC, TCG, GGA, GGC, ATT, ATT, CTC, ATT, ATT, GCC, GCT, GTA, TTA, GCG, ATG, ATT, ATG, GCC, AAC, AGC, GGT, GCA, ACC, AGT, GGA, TGG, TAT, CAC, GAC, TTT, CTT, GAG, ACG, CCG, GTT, CAG, CTC, CGG, GTT, GGG, ACA, CTT, GAG, ATC, AAC, AAG, AAC, ATG, CTG, CTA, TGG, ATC, AAT, GAC, GCT, CTG, ATG, GCG, GTA, TTT, TTC, CTG, TTG, GTT, GGT, CTG, GAA, GTT, AAA, CGC, GAG, CTG, ATG, CAA, GGT, TCG, CTG, GCC, AGT, CTG, CGC, CAG, GCG, GCA, TTT, CCT, GTT, ATT, GCC, GCA, ATC, GGC, GGG, ATG, ATT, GTC, CCG, GCA, TTG, CTC, TAT, CTG, GCT, TTT, AAC, TAT, GCC, GAT, CCG, ATT, ACC, CGC, GAA, GGC, TGG, GCA, ATC, CCG, GCG, GCG, ACT, GAC, ATT, GCC, TTT, GCA, CTT, GGT, GTG, TTG, GCG, CTG, TTG, GGA, AGT, CGT, GTT, CCG, TTA, GCG, CTG, AAG, ATC, TTT, TTG, ATG, GCT, CTG, GCT, ATT, ATC, GAC, GAT, CTT, GGG, GCC, ATC, ATT, ATC, ATC, GCA, TTG, TTC, TAC, ACT, AAT, GAC, TTA, TCG, ATG, GCC, TCT, CTT, GGC, GTC, GCG, GCT, GTA, GCA, ATT, GCG, GTA, CTC, GCG, GTA, TTG, AAT, CTG, TGT, GGT, GTA, CGC, CGC, ACG, GGC, GTT, TAT, ATT, CTG, GTT, GGC, GTG, GTG, CTG, TGG, ACA, GCG, GTG, TTG, AAA, TCG, GGG, GTT, CAC, GCA, ACC, CTG, GCT, GGC, GTC, ATT, GTC, GGC, TTC, TTT, ATT, CCT, TTG, AAA, GAG, AAG, CAT, GGG, CGC, TCT, CCG, GCT, AAA, CGT, CTG, GAG, CAT, GTT, TTG, CAT, CCA, TGG, GTG, GCG, TAT, CTG, ATT, TTG, CCG, CTG, TTT, GCA, TTT, GCT, AAT, GCT, GGC, GTT, TCA, CTG, CAA, GGT, GTC, ACG, CTG, GAA, GGT, TTG, ACC, TCC, ATT, CTG, CCA, TTA, GGG, ATC, ATC, GCT, GGT, TTG, CTG, ATT, GGC, AAG, CCA, CTG, GGT, ATT, AGT, CTG, TTC, TGC, TGG, TTG, GCG, CTG, CGT, TTG, AAA, TTG, GCA, CAT, CTG, CCA, GAG, GGA, ACG, ACT, TAC, CAG, CAA, ATT, ATG, GCG, GTT, GGT, ATC, CTG, TGC, GGT, ATC, GGT, TTT, ACT, ATG, TCT, ATC, TTT, ATT, GCC, AGC, CTG, GCA, TTT, GGT, AGC, GTA, GAT, CCA, GAA, CTG, ATT, AAC, TGG, GCA, AAA, TTA, GGT, ATC, CTT, GTC, GGT, TCA, ATT, TCT, TCG, GCG, GTA, ATT, GGA, TAT, AGC, TGG, TTA, CGC, 
GTT, CGT, TTA, CGT, CCA, TCA, GTT, TGA] +Is Protein?: NO + +Region Name: transcriptional activator protein NhaR +Nucleotides: ATGAGCATGTCTCATATCAATTACAACCACTTGTATTACTTCTGGCATGTCTACAAAGAAGGTTCTGTGGTTGGCGCAGCGGAGGCGCTTTATTTAACACCACAAACCATTACCGGGCAGATCCGGGCGCTGGAAGAGCGCCTGCAAGGGAAACTATTTAAGCGTAAAGGACGTGGTCTGGAACCCAGCGAACTGGGGGAACTGGTCTATCGCTATGCCGATAAAATGTTCACCTTAAGCCAGGAAATGCTGGATATCGTCAACTATCGCAAAGAGTCCAACTTATTGTTTGATGTTGGTGTGGCAGATGCACTTTCCAAACGTCTGGTCAGCAGTGTTCTGGATGCCGCAGTTGTGGAAGACGAGCAGATCCATCTACGCTGTTTCGAATCGACGCACGAGATGCTTTTAGAGCAGTTGAGTCAGCATAAACTGGATATGATCATCTCTGACTGTCCGATCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAATTGGCGAATGTGGTGTCAGTTTCTGGTGCACTAACCCACTACCAGAAAAGCCGTTTCCTGCCTGTCTTGAAGAGCGTCGTTTACTTATTCCGGGGCGTCGCTCAATGTTGGGGCGTAAACTATTAAACTGGTTTAACTCCCAGGGCTTGAACGTCGAAATTTTGGGTGAGTTTGATGATGCTGCGTTGATGAAAGCCTTTGGGGCGACGCATAACGCTATTTTCGTTGCACCTTCGCTTTACGCTAATGATTTCTATAACGATGACTCGGTTGTGGAGATAGGCCGTGTTGAGAACGTGATGGAAGAGTACCACGCGATTTTTGCCGAAAGGATGATTCAGCACCCTGCAGTACAGCGTATCTGCAATACAGACTATTCTGCGCTGTTTACTCCAGCTTCAAAATAA +Nuc. 
Counts: [228, 197, 232, 249] +Total Mass%: [25.9, 18.4, 29.5, 26.2] of 118909.8 +Codons List: [ATG, AGC, ATG, TCT, CAT, ATC, AAT, TAC, AAC, CAC, TTG, TAT, TAC, TTC, TGG, CAT, GTC, TAC, AAA, GAA, GGT, TCT, GTG, GTT, GGC, GCA, GCG, GAG, GCG, CTT, TAT, TTA, ACA, CCA, CAA, ACC, ATT, ACC, GGG, CAG, ATC, CGG, GCG, CTG, GAA, GAG, CGC, CTG, CAA, GGG, AAA, CTA, TTT, AAG, CGT, AAA, GGA, CGT, GGT, CTG, GAA, CCC, AGC, GAA, CTG, GGG, GAA, CTG, GTC, TAT, CGC, TAT, GCC, GAT, AAA, ATG, TTC, ACC, TTA, AGC, CAG, GAA, ATG, CTG, GAT, ATC, GTC, AAC, TAT, CGC, AAA, GAG, TCC, AAC, TTA, TTG, TTT, GAT, GTT, GGT, GTG, GCA, GAT, GCA, CTT, TCC, AAA, CGT, CTG, GTC, AGC, AGT, GTT, CTG, GAT, GCC, GCA, GTT, GTG, GAA, GAC, GAG, CAG, ATC, CAT, CTA, CGC, TGT, TTC, GAA, TCG, ACG, CAC, GAG, ATG, CTT, TTA, GAG, CAG, TTG, AGT, CAG, CAT, AAA, CTG, GAT, ATG, ATC, ATC, TCT, GAC, TGT, CCG, ATC, GAT, TCC, ACT, CAG, CAG, GAA, GGG, CTG, TTT, TCC, ATG, AAA, ATT, GGC, GAA, TGT, GGT, GTC, AGT, TTC, TGG, TGC, ACT, AAC, CCA, CTA, CCA, GAA, AAG, CCG, TTT, CCT, GCC, TGT, CTT, GAA, GAG, CGT, CGT, TTA, CTT, ATT, CCG, GGG, CGT, CGC, TCA, ATG, TTG, GGG, CGT, AAA, CTA, TTA, AAC, TGG, TTT, AAC, TCC, CAG, GGC, TTG, AAC, GTC, GAA, ATT, TTG, GGT, GAG, TTT, GAT, GAT, GCT, GCG, TTG, ATG, AAA, GCC, TTT, GGG, GCG, ACG, CAT, AAC, GCT, ATT, TTC, GTT, GCA, CCT, TCG, CTT, TAC, GCT, AAT, GAT, TTC, TAT, AAC, GAT, GAC, TCG, GTT, GTG, GAG, ATA, GGC, CGT, GTT, GAG, AAC, GTG, ATG, GAA, GAG, TAC, CAC, GCG, ATT, TTT, GCC, GAA, AGG, ATG, ATT, CAG, CAC, CCT, GCA, GTA, CAG, CGT, ATC, TGC, AAT, ACA, GAC, TAT, TCT, GCG, CTG, TTT, ACT, CCA, GCT, TCA, AAA, TAA] +Is Protein?: YES + +Region Name: riboflavin kinase +Nucleotides: 
ATGAAGCTGATACGCGGCATACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTAATTTCGACGGCGTGCATCGCGGTCATCGCGCGCTGTTACAGGGCTTGCAGGAAGAAGGGCGCAAGCGCAACTTACCGGTGATGGTGATGCTTTTTGAACCTCAACCACTGGAACTGTTTGCTACTGATAAAGCCCCGGCACGGCTCACCCGGCTGCGGGAAAAACTGCGTTATCTTGCAGAGTGTGGCGTTGATTACGTGCTGTGCGTGCGTTTTGACAGGCGTTTTGCGGCGTTAACCGCGCAAAACTTCATCAGTGATCTTCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGATTTCCGCTTTGGCGCTGGTCGTGAAGGCGATTTCTTGTTATTACAGAAAGCGGGCATGGAATACGGCTTCGATATCACCAGCACGCAAACTTTTTGCGAAGGTGGTGTGCGTATCAGCAGCACCGCCGTGCGTCAGGCGCTTGCGGATGACAATCTGGCTCTGGCAGAAAGTTTACTGGGGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGAATTAGGGCGCACTATAGGTTTCCCGACGGCGAATGTACCGCTACGCCGTCAGGTTTCCCCGGTGAAAGGGGTTTATGCGGTAGAAGTGTTGGGCCTTGGCGAAAAGCCGTTACCCGGCGTTGCAAACATCGGAACACGCCCAACGGTTGCCGGTATTCGCCAGCAACTGGAAGTGCATTTGTTAGATGTTGCAATGGACCTTTATGGTCGCCATATACAAGTAGTGCTGCGTAAAAAAATACGCAATGAGCAGCGATTTGCATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGCCCGCGAATTTTTTGGGCTAACAAAACCGGCTTAA +Nuc. Counts: [213, 221, 276, 232] +Total Mass%: [23.2, 19.8, 33.6, 23.4] of 124072.2 +Codons List: [ATG, AAG, CTG, ATA, CGC, GGC, ATA, CAT, AAT, CTC, AGC, CAG, GCC, CCG, CAA, GAA, GGG, TGT, GTG, CTG, ACT, ATT, GGT, AAT, TTC, GAC, GGC, GTG, CAT, CGC, GGT, CAT, CGC, GCG, CTG, TTA, CAG, GGC, TTG, CAG, GAA, GAA, GGG, CGC, AAG, CGC, AAC, TTA, CCG, GTG, ATG, GTG, ATG, CTT, TTT, GAA, CCT, CAA, CCA, CTG, GAA, CTG, TTT, GCT, ACT, GAT, AAA, GCC, CCG, GCA, CGG, CTC, ACC, CGG, CTG, CGG, GAA, AAA, CTG, CGT, TAT, CTT, GCA, GAG, TGT, GGC, GTT, GAT, TAC, GTG, CTG, TGC, GTG, CGT, TTT, GAC, AGG, CGT, TTT, GCG, GCG, TTA, ACC, GCG, CAA, AAC, TTC, ATC, AGT, GAT, CTT, CTG, GTG, AAG, CAC, TTG, CGG, GTA, AAA, TTT, CTT, GCC, GTA, GGT, GAC, GAT, TTC, CGC, TTT, GGC, GCT, GGT, CGT, GAA, GGC, GAT, TTC, TTG, TTA, TTA, CAG, AAA, GCG, GGC, ATG, GAA, TAC, GGC, TTC, GAT, ATC, ACC, AGC, ACG, CAA, ACT, TTT, TGC, GAA, GGT, GGT, GTG, CGT, ATC, AGC, AGC, ACC, GCC, GTG, CGT, CAG, GCG, CTT, GCG, GAT, GAC, AAT, CTG, GCT, CTG, GCA, GAA, AGT, TTA, CTG, GGG, CAC, CCG, TTT, GCT, ATC, 
TCC, GGG, CGT, GTA, GTC, CAC, GGT, GAT, GAA, TTA, GGG, CGC, ACT, ATA, GGT, TTC, CCG, ACG, GCG, AAT, GTA, CCG, CTA, CGC, CGT, CAG, GTT, TCC, CCG, GTG, AAA, GGG, GTT, TAT, GCG, GTA, GAA, GTG, TTG, GGC, CTT, GGC, GAA, AAG, CCG, TTA, CCC, GGC, GTT, GCA, AAC, ATC, GGA, ACA, CGC, CCA, ACG, GTT, GCC, GGT, ATT, CGC, CAG, CAA, CTG, GAA, GTG, CAT, TTG, TTA, GAT, GTT, GCA, ATG, GAC, CTT, TAT, GGT, CGC, CAT, ATA, CAA, GTA, GTG, CTG, CGT, AAA, AAA, ATA, CGC, AAT, GAG, CAG, CGA, TTT, GCA, TCG, CTG, GAC, GAA, CTG, AAA, GCG, CAG, ATT, GCG, CGT, GAT, GAA, TTA, ACC, GCC, CGC, GAA, TTT, TTT, GGG, CTA, ACA, AAA, CCG, GCT, TAA] +Is Protein?: YES + +Region Name: Isoleucyl-tRNA synthetase +Nucleotides: ATGAGTGACTATAAATCAACCCTGAATTTGCCGGAAACAGGGTTCCCGATGCGTGGCGATCTCGCCAAGCGCGAACCGGGAATGCTGGCGCGTTGGACTGATGATGATCTGTACGGCATCATCCGTGCGGCTAAAAAAGGCAAAAAAACCTTCATTCTGCATGATGGCCCTCCTTATGCGAATGGCAGCATTCATATTGGTCACTCGGTTAACAAGATTCTGAAAGACATTATCATTAAGTCCAAAGGGCTTTCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCATGGTCTGCCAATCGAACTGAAAGTAGAGCAAGAATACGGTAAGCCGGGGGAGAAATTCACCGCCGCTGAGTTCCGCGCCAAGTGCCGCGAATACGCTGCGACCCAGGTTGACGGTCAGCGCAAAGACTTTATCCGTCTGGGCGTGCTGGGCGACTGGTCGCACCCGTACCTGACCATGGACTTCAAAACTGAAGCCAACATCATCCGCGCGCTGGGCAAAATCATCGGCAACGGTCACCTGCACAAAGGCGCGAAGCCGGTGCACTGGTGCGTTGACTGCCGTTCTGCACTGGCAGAAGCGGAAGTTGAGTATTACGACAAAACTTCTCCGTCCATCGACGTCGCTTTCCAGGCGGTCGATCAGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATGTTAACGGCCCAATTTCGCTGGTTATCTGGACCACCACGCCGTGGACGCTGCCTGCTAACCGCGCAATCTCCATTGCACCTGATTTTGATTATGCGCTGGTGCAAATCGACGGTCAGGCCGTGATCCTCGCGAAAGATCTGGTTGAAAGCGTAATGCAGCGTATCGGCGTTAGCGATTACACCATTCTTGGCACGGTGAAAGGTGCCGAGCTGGAACTGTTGCGCTTTACCCATCCGTTTATGGACTTCGATGTTCCGGCAATTCTCGGCGACCACGTTACGCTGGATGCCGGTACCGGTGCCGTTCATACCGCGCCAGGCCACGGTCCGGACGACTATGTGATCGGTCAAAAATATGGTCTGGAAACCGCTAACCCGGTTGGCCCGGACGGCACTTATCTGCCGGGTACTTACCCGACTCTGGATGGCGTTAACGTCTTCAAAGCGAACGATATTGTCATTGCGTTGTTGCAGGAAAAAGGCGCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTGCTGCTGGCGTCATAAAACGCCGATCATCTTCCGCGCGACGCCGCAGTGGTTCGTCAGCATGGATCAGAAAGGTCTGCGTGCGCAGTCACTGAAAGAG
ATCAAAGGCGTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATCTCTCGTCAGCGTACCTGGGGCGTGCCGATGTCACTGTTCGTGCACAAAGACACAGAAGAACTGCATCCGCGTACTCTCGAACTGATGGAAGAAGTGGCAAAACGCGTTGAAGTTGACGGCATTCAGGCGTGGTGGGATCTCGATGCGAAAGAGATCCTCGGCGACGAAGCTGACCAGTATGTGAAAGTACCGGATACGCTGGATGTATGGTTTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTCCGGAATTTGCCGGTCACGCAGCGGACATGTATCTGGAAGGTTCTGACCAACACCGTGGCTGGTTCATGTCTTCCCTGATGATCTCTACCGCGATGAAGGGCAAAGCGCCATATCGTCAGGTACTGACTCACGGCTTTACCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGTAACACCGTTTCGCCGCAGGATGTGATGAATAAACTGGGTGCGGATATTCTGCGTCTGTGGGTGGCATCAACCGACTACACTGGCGAAATGGCCGTTTCTGACGAGATCCTGAAACGTGCTGCCGACAGCTATCGTCGTATCCGTAACACCGCGCGCTTCCTGCTGGCAAACCTGAACGGTTTTGATCCGGCAAAAGATATGGTGAAACCGGAAGAGATGGTGGTACTGGATCGCTGGGCCGTAGGTTGTGCGAAAGCGGCACAGGAAGACATCCTCAAGGCGTACGAAGCATACGATTTCCACGAAGTGGTACAGCGTCTGATGCGCTTCTGCTCCGTTGAGATGGGTTCCTTCTACCTCGACATCATCAAAGACCGTCAGTATACCGCCAAAGCGGACAGCGTGGCGCGTCGTAGCTGCCAGACTGCGCTGTATCACATCGCAGAAGCGCTGGTTCGCTGGATGGCACCAATCCTCTCCTTCACCGCTGATGAAGTGTGGGGTTACCTGCCGGGCGAACGTGAAAAATACGTCTTCACCGGCGAGTGGTACGAAGGCCTGTTTGGTCTGGCAGACAGTGAAGCAATGAACGATGCGTTCTGGGACGAGCTGTTGAAAGTGCGTGGCGAAGTGAACAAAGTCATTGAGCAAGCGCGTGCCGATAAGAACGTGGGCGGCTCGCTGGAAGCGGCAGTAACCTTGTATGCAGAACCGGAACTGGCGGCGAAACTGACCGCGCTGGGCGATGAATTACGATTTGTCCTGTTGACCTCCGGCGCTACCGTTGCAGACTATAACGACGCACCTGCTGATGCCCAGCAGAGCGAAGTCCTCAAAGGGCTGAAAGTCGCGTTGAGTAAAGCCGAAGGTGAGAAGTGTCCTCGCTGCTGGCACTACACCCAGGATGTCGGCAAGGTGGCGGAACACGCAGAAATCTGCGGCCGCTGTGTCAGCAACGTCGCCGGTGACGGTGAAAAACGTAAGTTTGCCTGA +Nuc. 
Counts: [660, 720, 817, 620] +Total Mass%: [24.1, 21.6, 33.4, 21.0] of 370216.6 +Codons List: [ATG, AGT, GAC, TAT, AAA, TCA, ACC, CTG, AAT, TTG, CCG, GAA, ACA, GGG, TTC, CCG, ATG, CGT, GGC, GAT, CTC, GCC, AAG, CGC, GAA, CCG, GGA, ATG, CTG, GCG, CGT, TGG, ACT, GAT, GAT, GAT, CTG, TAC, GGC, ATC, ATC, CGT, GCG, GCT, AAA, AAA, GGC, AAA, AAA, ACC, TTC, ATT, CTG, CAT, GAT, GGC, CCT, CCT, TAT, GCG, AAT, GGC, AGC, ATT, CAT, ATT, GGT, CAC, TCG, GTT, AAC, AAG, ATT, CTG, AAA, GAC, ATT, ATC, ATT, AAG, TCC, AAA, GGG, CTT, TCT, GGA, TAT, GAC, TCG, CCG, TAT, GTG, CCT, GGC, TGG, GAC, TGT, CAT, GGT, CTG, CCA, ATC, GAA, CTG, AAA, GTA, GAG, CAA, GAA, TAC, GGT, AAG, CCG, GGG, GAG, AAA, TTC, ACC, GCC, GCT, GAG, TTC, CGC, GCC, AAG, TGC, CGC, GAA, TAC, GCT, GCG, ACC, CAG, GTT, GAC, GGT, CAG, CGC, AAA, GAC, TTT, ATC, CGT, CTG, GGC, GTG, CTG, GGC, GAC, TGG, TCG, CAC, CCG, TAC, CTG, ACC, ATG, GAC, TTC, AAA, ACT, GAA, GCC, AAC, ATC, ATC, CGC, GCG, CTG, GGC, AAA, ATC, ATC, GGC, AAC, GGT, CAC, CTG, CAC, AAA, GGC, GCG, AAG, CCG, GTG, CAC, TGG, TGC, GTT, GAC, TGC, CGT, TCT, GCA, CTG, GCA, GAA, GCG, GAA, GTT, GAG, TAT, TAC, GAC, AAA, ACT, TCT, CCG, TCC, ATC, GAC, GTC, GCT, TTC, CAG, GCG, GTC, GAT, CAG, GAT, GCG, CTG, AAA, ACG, AAA, TTT, GGC, GTA, AGC, AAT, GTT, AAC, GGC, CCA, ATT, TCG, CTG, GTT, ATC, TGG, ACC, ACC, ACG, CCG, TGG, ACG, CTG, CCT, GCT, AAC, CGC, GCA, ATC, TCC, ATT, GCA, CCT, GAT, TTT, GAT, TAT, GCG, CTG, GTG, CAA, ATC, GAC, GGT, CAG, GCC, GTG, ATC, CTC, GCG, AAA, GAT, CTG, GTT, GAA, AGC, GTA, ATG, CAG, CGT, ATC, GGC, GTT, AGC, GAT, TAC, ACC, ATT, CTT, GGC, ACG, GTG, AAA, GGT, GCC, GAG, CTG, GAA, CTG, TTG, CGC, TTT, ACC, CAT, CCG, TTT, ATG, GAC, TTC, GAT, GTT, CCG, GCA, ATT, CTC, GGC, GAC, CAC, GTT, ACG, CTG, GAT, GCC, GGT, ACC, GGT, GCC, GTT, CAT, ACC, GCG, CCA, GGC, CAC, GGT, CCG, GAC, GAC, TAT, GTG, ATC, GGT, CAA, AAA, TAT, GGT, CTG, GAA, ACC, GCT, AAC, CCG, GTT, GGC, CCG, GAC, GGC, ACT, TAT, CTG, CCG, GGT, ACT, TAC, CCG, ACT, CTG, GAT, GGC, GTT, AAC, GTC, TTC, AAA, GCG, AAC, GAT, 
ATT, GTC, ATT, GCG, TTG, TTG, CAG, GAA, AAA, GGC, GCA, CTG, TTG, CAC, GTT, GAG, AAA, ATG, CAA, CAC, AGC, TAT, CCG, TGC, TGC, TGG, CGT, CAT, AAA, ACG, CCG, ATC, ATC, TTC, CGC, GCG, ACG, CCG, CAG, TGG, TTC, GTC, AGC, ATG, GAT, CAG, AAA, GGT, CTG, CGT, GCG, CAG, TCA, CTG, AAA, GAG, ATC, AAA, GGC, GTG, CAG, TGG, ATC, CCT, GAC, TGG, GGC, CAG, GCG, CGT, ATC, GAG, TCG, ATG, GTT, GCT, AAC, CGT, CCT, GAC, TGG, TGT, ATC, TCT, CGT, CAG, CGT, ACC, TGG, GGC, GTG, CCG, ATG, TCA, CTG, TTC, GTG, CAC, AAA, GAC, ACA, GAA, GAA, CTG, CAT, CCG, CGT, ACT, CTC, GAA, CTG, ATG, GAA, GAA, GTG, GCA, AAA, CGC, GTT, GAA, GTT, GAC, GGC, ATT, CAG, GCG, TGG, TGG, GAT, CTC, GAT, GCG, AAA, GAG, ATC, CTC, GGC, GAC, GAA, GCT, GAC, CAG, TAT, GTG, AAA, GTA, CCG, GAT, ACG, CTG, GAT, GTA, TGG, TTT, GAC, TCC, GGA, TCT, ACC, CAC, TCT, TCC, GTT, GTT, GAT, GTG, CGT, CCG, GAA, TTT, GCC, GGT, CAC, GCA, GCG, GAC, ATG, TAT, CTG, GAA, GGT, TCT, GAC, CAA, CAC, CGT, GGC, TGG, TTC, ATG, TCT, TCC, CTG, ATG, ATC, TCT, ACC, GCG, ATG, AAG, GGC, AAA, GCG, CCA, TAT, CGT, CAG, GTA, CTG, ACT, CAC, GGC, TTT, ACC, GTG, GAT, GGT, CAG, GGT, CGC, AAG, ATG, TCT, AAA, TCC, ATC, GGT, AAC, ACC, GTT, TCG, CCG, CAG, GAT, GTG, ATG, AAT, AAA, CTG, GGT, GCG, GAT, ATT, CTG, CGT, CTG, TGG, GTG, GCA, TCA, ACC, GAC, TAC, ACT, GGC, GAA, ATG, GCC, GTT, TCT, GAC, GAG, ATC, CTG, AAA, CGT, GCT, GCC, GAC, AGC, TAT, CGT, CGT, ATC, CGT, AAC, ACC, GCG, CGC, TTC, CTG, CTG, GCA, AAC, CTG, AAC, GGT, TTT, GAT, CCG, GCA, AAA, GAT, ATG, GTG, AAA, CCG, GAA, GAG, ATG, GTG, GTA, CTG, GAT, CGC, TGG, GCC, GTA, GGT, TGT, GCG, AAA, GCG, GCA, CAG, GAA, GAC, ATC, CTC, AAG, GCG, TAC, GAA, GCA, TAC, GAT, TTC, CAC, GAA, GTG, GTA, CAG, CGT, CTG, ATG, CGC, TTC, TGC, TCC, GTT, GAG, ATG, GGT, TCC, TTC, TAC, CTC, GAC, ATC, ATC, AAA, GAC, CGT, CAG, TAT, ACC, GCC, AAA, GCG, GAC, AGC, GTG, GCG, CGT, CGT, AGC, TGC, CAG, ACT, GCG, CTG, TAT, CAC, ATC, GCA, GAA, GCG, CTG, GTT, CGC, TGG, ATG, GCA, CCA, ATC, CTC, TCC, TTC, ACC, GCT, GAT, GAA, GTG, TGG, GGT, TAC, CTG, CCG, GGC, GAA, 
CGT, GAA, AAA, TAC, GTC, TTC, ACC, GGC, GAG, TGG, TAC, GAA, GGC, CTG, TTT, GGT, CTG, GCA, GAC, AGT, GAA, GCA, ATG, AAC, GAT, GCG, TTC, TGG, GAC, GAG, CTG, TTG, AAA, GTG, CGT, GGC, GAA, GTG, AAC, AAA, GTC, ATT, GAG, CAA, GCG, CGT, GCC, GAT, AAG, AAC, GTG, GGC, GGC, TCG, CTG, GAA, GCG, GCA, GTA, ACC, TTG, TAT, GCA, GAA, CCG, GAA, CTG, GCG, GCG, AAA, CTG, ACC, GCG, CTG, GGC, GAT, GAA, TTA, CGA, TTT, GTC, CTG, TTG, ACC, TCC, GGC, GCT, ACC, GTT, GCA, GAC, TAT, AAC, GAC, GCA, CCT, GCT, GAT, GCC, CAG, CAG, AGC, GAA, GTC, CTC, AAA, GGG, CTG, AAA, GTC, GCG, TTG, AGT, AAA, GCC, GAA, GGT, GAG, AAG, TGT, CCT, CGC, TGC, TGG, CAC, TAC, ACC, CAG, GAT, GTC, GGC, AAG, GTG, GCG, GAA, CAC, GCA, GAA, ATC, TGC, GGC, CGC, TGT, GTC, AGC, AAC, GTC, GCC, GGT, GAC, GGT, GAA, AAA, CGT, AAG, TTT, GCC, TGA] +Is Protein?: YES + +Region Name: Non-protein region +Nucleotides: GCTTGCGCCAACGCCATTTCATCGCCATCCCGCCGAGCATACAGGCCTCGGAAGAACCAATGGTGTTGGTGCCAACGGCCTGACCATTTTTCGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGCAGATTGCGGATATTCTTCTTTGTCGATCCAGTTTTTGTTAATGGATAAATCCA +Nuc. 
Counts: [46, 56, 49, 53] +Total Mass%: [23.5, 23.5, 28.0, 25.0] of 26473.6 +Codons List: [GCT, TGC, GCC, AAC, GCC, ATT, TCA, TCG, CCA, TCC, CGC, CGA, GCA, TAC, AGG, CCT, CGG, AAG, AAC, CAA, TGG, TGT, TGG, TGC, CAA, CGG, CCT, GAC, CAT, TTT, TCG, GTG, CAG, GCG, CAT, GCC, ACA, GAT, CGG, CAA, CCA, TGT, TTA, CGC, AAC, GCA, GAT, CGA, TTG, CTG, CAG, ATT, GCG, GAT, ATT, CTT, CTT, TGT, CGA, TCC, AGT, TTT, TGT, TAA, TGG, ATA, AAT, CCA] +Is Protein?: NO + +Region Name: FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase +Nucleotides: ATGTCTGAATCTGTACAGAGCAATAGCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGATGGCACCACCGCTGAGTCTACCCGCAACAACGGTAAACCGGCGCTGTTCCGCCTGGGTGATGCTTCTCTTTCTGAAGGGCTGGAGCAACACCTGCTGGGGCTGAAAGTGGGCGATAAAACCACCTTCTCGCTGGAGCCAGATGCGGCGTTTGGCGTGCCGTCACCGGACCTGATTCAGTACTTCTCCCGCCGTGAATTTATGGATGCAGGCGAGCCAGAAATTGGCGCAATCATGCTTTTTACCGCAATGGATGGCAGTGAGATGCCTGGCGTGATCCGCGAAATTAACGGCGACTCCATTACCGTTGATTTCAACCATCCGCTGGCCGGGCAGACCGTTCATTTTGATATTGAAGTGCTGGAAATCGATCCGGCACTGGAGGCGTAA +Nuc. Counts: [100, 121, 125, 104] +Total Mass%: [23.0, 22.8, 32.1, 22.1] of 58858.4 +Codons List: [ATG, TCT, GAA, TCT, GTA, CAG, AGC, AAT, AGC, GCC, GTC, CTG, GTG, CAC, TTC, ACG, CTA, AAA, CTC, GAC, GAT, GGC, ACC, ACC, GCT, GAG, TCT, ACC, CGC, AAC, AAC, GGT, AAA, CCG, GCG, CTG, TTC, CGC, CTG, GGT, GAT, GCT, TCT, CTT, TCT, GAA, GGG, CTG, GAG, CAA, CAC, CTG, CTG, GGG, CTG, AAA, GTG, GGC, GAT, AAA, ACC, ACC, TTC, TCG, CTG, GAG, CCA, GAT, GCG, GCG, TTT, GGC, GTG, CCG, TCA, CCG, GAC, CTG, ATT, CAG, TAC, TTC, TCC, CGC, CGT, GAA, TTT, ATG, GAT, GCA, GGC, GAG, CCA, GAA, ATT, GGC, GCA, ATC, ATG, CTT, TTT, ACC, GCA, ATG, GAT, GGC, AGT, GAG, ATG, CCT, GGC, GTG, ATC, CGC, GAA, ATT, AAC, GGC, GAC, TCC, ATT, ACC, GTT, GAT, TTC, AAC, CAT, CCG, CTG, GCC, GGG, CAG, ACC, GTT, CAT, TTT, GAT, ATT, GAA, GTG, CTG, GAA, ATC, GAT, CCG, GCA, CTG, GAG, GCG, TAA] +Is Protein?: YES + diff --git a/dna/spec/spec.pdf b/dna/spec/spec.pdf new file mode 100644 index 0000000..d6d475a Binary files /dev/null and b/dna/spec/spec.pdf differ