move calendar readme to right dir.

add dna assignment.
This commit is contained in:
Matthew Jensen 2019-12-13 14:01:10 -08:00
parent 9e458e8709
commit 7b04c359f4
16 changed files with 1157 additions and 8 deletions

View File

@ -1,10 +1,8 @@
# Topics:
File I/o (input / output), Arrays
# Introduction to Programming in Java
## Learning Outcomes:
## Contents
- Practice Reading in files to java and processing file text content
- Become comfortable with using arrays to store and retrieve data
- Design and develop programs in accepted style
- Develop further the ability to enhance a program to increase functionality
- Execute the proper steps to write out desired content to a file
**Projects**
- Calendar
- DNA

10
calendar/README.md Normal file
View File

@ -0,0 +1,10 @@
# Topics:
File I/O (input / output), Arrays
## Learning Outcomes:
- Practice reading files into Java and processing file text content
- Become comfortable with using arrays to store and retrieve data
- Design and develop programs in accepted style
- Develop further the ability to enhance a program to increase functionality
- Execute the proper steps to write out desired content to a file

332
dna/DNA.java Normal file
View File

@ -0,0 +1,332 @@
import java.util.*;
import java.io.*;
import java.text.*;
/**
 * Reports information about DNA nucleotide sequences that may encode proteins.
 *
 * The input file consists of line pairs: a region name followed by its
 * nucleotide sequence (A, C, G, T or the junk character '-', in either case).
 * For every pair the program writes the nucleotide counts, the mass
 * percentages, the codon list and whether the region looks like a protein.
 *
 * All per-nucleotide arrays in this class are in A, C, G, T order; arrays that
 * also cover junk put '-' last (index 4).
 */
public class DNA {
    /** The minimum number of codons a valid protein must have. */
    public static final int MIN_CODONS = 5;
    /** The minimum percentage of total mass that C and G must contribute for a protein to be valid. */
    public static final int MIN_MASS_PERCENT = 30;
    /** The number of unique nucleotides (A, C, G and T). */
    public static final int UNIQUE_NUCLEOTIDES = 4;
    /** The number of nucleotides per codon (the name is reversed but kept for compatibility). */
    public static final int CODONS_PER_NUCLEOTIDE = 3;
    /** Directory prefix prepended to the input file name. */
    public static final String INPUT_DIR = "input/";
    /** Directory prefix prepended to the output file name. */
    public static final String OUTPUT_DIR = "output/";
    /** When true, the prompts are skipped and fixed file names are used. */
    public static final boolean DEBUG = false;
    /** Molar masses (grams/mol) of A, C, G, T and junk, in that order. */
    public static final double[] MOLAR_MASSES = {135.128, 111.103, 151.128, 125.107, 100.00};
    /** Nucleotide characters in the same order as MOLAR_MASSES and nucleotideIndexFromChar. */
    public static final char[] NUCLEOTIDES = {'A', 'C', 'G', 'T', '-'};

    /**
     * Begins with an introduction and prompts for input and output file names,
     * reads the input file to process its nucleotide sequences, and writes the
     * results into the given output file.
     *
     * A trailing region name without a sequence line is ignored. If the input
     * file is missing or unreadable a message is printed and nothing is written.
     *
     * @param args unused
     * @throws FileNotFoundException if the input or output file cannot be opened
     */
    public static void main(String[] args) throws FileNotFoundException {
        // The console scanner wraps System.in and is deliberately not closed.
        Scanner console = new Scanner(System.in);
        String[] files = promptForFileNames(console);
        File inFile = new File(INPUT_DIR + files[0]);
        File outFile = new File(OUTPUT_DIR + files[1]);

        if (!inFile.isFile() || !inFile.canRead()) {
            System.err.println("Cannot read input file: " + inFile.getPath());
            return;
        }

        // Only complete (name, sequence) pairs are processed.
        int sequenceCount = linesInFile(inFile) / 2;
        String[] sequenceNames = new String[sequenceCount];
        String[] sequences = new String[sequenceCount];

        try (Scanner input = new Scanner(inFile)) {
            for (int i = 0; i < sequenceCount; i++) {
                sequenceNames[i] = input.nextLine();
                sequences[i] = input.nextLine().toUpperCase(Locale.ROOT);
            }
        }

        try (PrintStream output = new PrintStream(outFile)) {
            saveOutput(sequences, sequenceNames, output);
        }
    }

    /**
     * Writes the report for every sequence to the given stream.
     * Sequences are printed as passed in; counts and mass percentages are
     * shown in A, C, G, T order.
     *
     * @param sequences nucleotide sequences, one per region
     * @param names     region names, parallel to sequences
     * @param output    stream that receives the report
     */
    public static void saveOutput(String[] sequences, String[] names, PrintStream output) {
        for (int i = 0; i < sequences.length; i++) {
            String sequence = sequences[i];
            output.println("Region Name: " + names[i]);
            output.println("Nucleotides: " + sequence);
            output.println("Nuc. Counts: " + Arrays.toString(nucleotideCountFromSequence(sequence)));
            output.println("Total Mass%: " + Arrays.toString(nucleotideMassPercentFromSequence(sequence))
                    + " of " + totalMassFromSequence(sequence));
            output.println("Codons List: " + Arrays.toString(codonsFromSequence(sequence)));
            output.println("Is Protein?: " + (isProtein(sequence) ? "YES" : "NO"));
            output.println();
        }
    }

    /**
     * Tests whether a sequence is a protein-coding region: at least MIN_CODONS
     * codons, starts with ATG, ends with TAA, TAG or TGA, and C plus G account
     * for at least MIN_MASS_PERCENT percent of the total mass (junk included
     * in the total).
     *
     * @param sequence nucleotide sequence, any case, may contain '-'
     * @return true if all four conditions hold
     */
    public static boolean isProtein(String sequence) {
        String[] codons = codonsFromSequence(sequence.toUpperCase(Locale.ROOT));
        // Length is checked first so the first/last codon lookups are safe.
        if (codons.length < MIN_CODONS) {
            return false;
        }
        if (!codons[0].equals("ATG")) {
            return false;
        }
        String last = codons[codons.length - 1];
        if (!last.equals("TAA") && !last.equals("TAG") && !last.equals("TGA")) {
            return false;
        }

        int[] counts = countAll(sequence);
        double total = rawTotalMass(counts);
        if (total <= 0.0) {
            return false;
        }
        int c = nucleotideIndexFromChar('C');
        int g = nucleotideIndexFromChar('G');
        double cgPercent = (counts[c] * MOLAR_MASSES[c] + counts[g] * MOLAR_MASSES[g]) / total * 100.0;
        return cgPercent >= MIN_MASS_PERCENT;
    }

    /**
     * Computes the mass contributed by each of A, C, G and T (junk excluded).
     *
     * @param sequence nucleotide sequence, any case, may contain '-'
     * @return array of size UNIQUE_NUCLEOTIDES with masses rounded to two decimals
     */
    public static double[] nucleotideMassesFromSequence(String sequence) {
        int[] counts = nucleotideCountFromSequence(sequence);
        double[] masses = new double[UNIQUE_NUCLEOTIDES];
        for (int i = 0; i < masses.length; i++) {
            masses[i] = roundTo(counts[i] * MOLAR_MASSES[i], 2);
        }
        return masses;
    }

    /**
     * Computes the percentage of the total mass (junk included) contributed by
     * each of A, C, G and T. The division uses unrounded masses so rounding
     * happens only once, on the final percentage.
     *
     * @param sequence nucleotide sequence, any case, may contain '-'
     * @return array of size UNIQUE_NUCLEOTIDES with percentages rounded to one
     *         decimal; all zeros when the sequence has no mass
     */
    public static double[] nucleotideMassPercentFromSequence(String sequence) {
        int[] counts = countAll(sequence);
        double total = rawTotalMass(counts);
        double[] percentages = new double[UNIQUE_NUCLEOTIDES];
        if (total <= 0.0) {
            return percentages;
        }
        for (int i = 0; i < percentages.length; i++) {
            percentages[i] = roundTo(counts[i] * MOLAR_MASSES[i] / total * 100.0, 1);
        }
        return percentages;
    }

    /**
     * Computes the total mass of the sequence, junk included.
     *
     * @param sequence nucleotide sequence, any case, may contain '-'
     * @return total mass rounded to one decimal
     */
    public static double totalMassFromSequence(String sequence) {
        return roundTo(rawTotalMass(countAll(sequence)), 1);
    }

    /**
     * Counts exact (case-sensitive) occurrences of a character in a sequence.
     *
     * @param sequence   text to scan
     * @param nucleotide character to look for
     * @return number of positions holding that character
     */
    public static int nucleotideCount(String sequence, char nucleotide) {
        int count = 0;
        for (char current : sequence.toCharArray()) {
            if (current == nucleotide) {
                count++;
            }
        }
        return count;
    }

    /**
     * Converts a nucleotide character to its molar mass (grams/mol).
     * Junk regions are excluded from many computations but do contribute
     * mass to the total.
     *   Adenine (A): 135.128
     *   Cytosine (C): 111.103
     *   Guanine (G): 151.128
     *   Thymine (T): 125.107
     *   Junk (-): 100.000
     *
     * @param nucleotide one of A, C, G, T (any case) or '-'
     * @return the unrounded molar mass from MOLAR_MASSES
     * @throws IllegalArgumentException if the character is not a known nucleotide
     */
    public static double nucleotideToMolarMass(char nucleotide) {
        int index = nucleotideIndexFromChar(nucleotide);
        if (index < 0) {
            throw new IllegalArgumentException("Unknown nucleotide: " + nucleotide);
        }
        return MOLAR_MASSES[index];
    }

    /**
     * Passes over a nucleotide sequence and counts the number of As, Cs, Gs
     * and Ts. Junk ('-') and unrecognized characters are skipped.
     *
     * @param sequence nucleotide sequence, any case, may contain '-'
     * @return counts array of size UNIQUE_NUCLEOTIDES in A, C, G, T order
     */
    public static int[] nucleotideCountFromSequence(String sequence) {
        int[] counts = new int[UNIQUE_NUCLEOTIDES];
        for (int i = 0; i < sequence.length(); i++) {
            int index = nucleotideIndexFromChar(sequence.charAt(i));
            if (index >= 0 && index < counts.length) {
                counts[index]++;
            }
        }
        return counts;
    }

    /**
     * Converts a single character into its array index: A=0, C=1, G=2, T=3
     * (either case) and junk '-'=4.
     *
     * @param nucleotide character to map
     * @return the index, or -1 if the character is not a known nucleotide
     */
    public static int nucleotideIndexFromChar(char nucleotide) {
        switch (nucleotide) {
            case 'a':
            case 'A':
                return 0;
            case 'c':
            case 'C':
                return 1;
            case 'g':
            case 'G':
                return 2;
            case 't':
            case 'T':
                return 3;
            case '-':
                return 4;
            default:
                return -1;
        }
    }

    /**
     * Removes the junk character '-' from a sequence.
     *
     * @param sequence raw sequence
     * @return sequence without any '-' characters
     */
    public static String removeJunk(String sequence) {
        return sequence.replace("-", "");
    }

    /**
     * Breaks the sequence into codons of CODONS_PER_NUCLEOTIDE characters.
     * Junk is removed first so dashes never end up inside a codon; leftover
     * characters that do not fill a whole codon are dropped.
     *
     * @param sequence nucleotide sequence, may contain '-'
     * @return array of codon strings in sequence order
     */
    public static String[] codonsFromSequence(String sequence) {
        String nucleotides = removeJunk(sequence);
        String[] codons = new String[nucleotides.length() / CODONS_PER_NUCLEOTIDE];
        for (int i = 0; i < codons.length; i++) {
            int start = i * CODONS_PER_NUCLEOTIDE;
            codons[i] = nucleotides.substring(start, start + CODONS_PER_NUCLEOTIDE);
        }
        return codons;
    }

    /**
     * Prints the introduction and prompts for the input and output file names.
     * Each prompt repeats until validFilename accepts the answer. When DEBUG
     * is true no prompt is shown and fixed names are returned.
     *
     * @param console scanner to read the answers from
     * @return array of two names: [0] input file, [1] output file
     */
    public static String[] promptForFileNames(Scanner console) {
        System.out.println("This program reports information about DNA");
        System.out.println("nucleotide sequences that may encode");
        System.out.println("proteins.");
        if (DEBUG) {
            return new String[] {"dna.txt", "dna.txt"};
        }
        String[] files = new String[2];
        files[0] = promptUntilValid(console, "Input file name? ");
        files[1] = promptUntilValid(console, "Output file name? ");
        System.out.println();
        return files;
    }

    /**
     * Counts the lines in a file.
     *
     * @param file file to read
     * @return number of lines (0 for an empty file)
     * @throws FileNotFoundException if the file cannot be opened
     */
    public static int linesInFile(File file) throws FileNotFoundException {
        int count = 0;
        try (Scanner input = new Scanner(file)) {
            while (input.hasNextLine()) {
                input.nextLine();
                count++;
            }
        }
        return count;
    }

    /**
     * Checks a file name typed by the user. An empty or blank name is rejected
     * because it would resolve to the directory itself.
     *
     * @param name file name to check
     * @return true if the name is non-null and not blank
     */
    public static boolean validFilename(String name) {
        return name != null && !name.trim().isEmpty();
    }

    // Shows the prompt and reads a line, repeating until validFilename accepts it.
    private static String promptUntilValid(Scanner console, String prompt) {
        System.out.print(prompt);
        String name = console.nextLine();
        while (!validFilename(name)) {
            System.out.println("Invalid. Try again.");
            System.out.print(prompt);
            name = console.nextLine();
        }
        return name;
    }

    // Counts A, C, G, T and junk (any case) in MOLAR_MASSES order; other characters are skipped.
    private static int[] countAll(String sequence) {
        int[] counts = new int[MOLAR_MASSES.length];
        for (int i = 0; i < sequence.length(); i++) {
            int index = nucleotideIndexFromChar(sequence.charAt(i));
            if (index >= 0) {
                counts[index]++;
            }
        }
        return counts;
    }

    // Sums count * molar mass over all entries without any intermediate rounding.
    private static double rawTotalMass(int[] counts) {
        double total = 0.0;
        for (int i = 0; i < counts.length; i++) {
            total += counts[i] * MOLAR_MASSES[i];
        }
        return total;
    }

    // Rounds to the given number of decimal places; locale-independent, unlike a DecimalFormat round trip.
    private static double roundTo(double value, int places) {
        double scale = Math.pow(10, places);
        return Math.round(value * scale) / scale;
    }
}

214
dna/README.md Normal file
View File

@ -0,0 +1,214 @@
# Topics:
DNA.java focuses on arrays and file/text processing.
DNA requires the two input files dna.txt and ecoli.txt.
These files are saved in the input/ folder. This can be changed with INPUT\_DIR.
DNA processes input files, parses the genomic information, and saves the output in a new file.
## Learning Outcomes:
# Background
DNA consists of long chains of chemical compounds called nucleotides.
Four nucleotides are present in DNA: Adenine (A), Cytosine (C), Guanine (G), and Thymine (T).
These are organized into subunits called "codons".
Most genes contain codons for building proteins, some do not.
Each codon (e.g. TAC GGA) uniquely encodes a single amino acid, a building block of proteins.
The sequences of DNA that encode proteins occur between a start codon (which we will assume to be ATG) and a stop codon (which is any of TAA, TAG, or TGA).
Not all regions of DNA are genes; large portions do not lie between a start codon and a stop codon.
Start: ATG.
Stop: TAA, TAG, TGA.
Often high percentages of Cytosine (C) and Guanine (G) are indicators of important genetic data.
# Input
- The DNA input data consists of line pairs.
- The input file exists, is readable, and contains valid input.
- The first line has the name of the nucleotide sequence.
- The second is the nucleotide sequence itself.
- Each character in a sequence of nucleotides will be A, C, G, T, or a dash character, "-", either upper or lowercase.
- You may assume that each sequence's number of nucleotides (without dashes) will be a multiple of 3.
## Example
> cure for cancer protein
> ATGCCACTATGGTAG
> captain picard hair growth protein
> ATgCCAACATGgATGCCcGATAtGGATTgA
> bogus protein
> CCATt-AATgATCa-CAGTt
> ...
# Process:
- from the original nucleotide sequence string to nucleotide counts.
- from nucleotide counts to mass percentages.
- from the original nucleotide sequence string to codon triplets.
# Output:
For each nucleotide sequence:
- nucleotide counts
- Counts the occurrences of each of the four nucleotides ['A', 'C', 'G', 'T'].
- mass percentages
- Calculates the mass percentage occupied by each nucleotide type, rounded to one digit past the decimal point.
- codons
- Reports the codons (e.g. TAG) present in each sequence.
- protein-coding gene
- begins with a valid start codon ["ATG"]
- ends with a valid stop codon ["TAA", "TAG", or "TGA"]
- contains at least 5 total codons (including its initial start codon and final stop codon)
- Cytosine (C) and Guanine (G) combined account for at least 30% of its total mass
## Example
> This program reports information about DNA
> nucleotide sequences that may encode
> proteins.
> Input file name? dna.txt
> Output file name? output.txt
> Output file output.txt after above execution (partial):
> Region Name: cure for cancer protein
> Nucleotides: ATGCCACTATGGTAG
> Nuc. Counts: [4, 3, 4, 4]
> Total Mass%: [27.3, 16.8, 30.6, 25.3] of 1978.8
> Codons List: [ATG, CCA, CTA, TGG, TAG]
> Is Protein?: YES
> ...
# Approach
## Constants
```java
int MIN_CODONS = 5; //the minimum number of codons a valid protein must have
int MIN_MASS_PERCENT = 30; // the percentage of mass from C and G in order for a protein to be valid
int UNIQUE_NUCLEOTIDES = 4; // the number of unique nucleotides (representing A, C, G, and T)
int CODONS_PER_NUCLEOTIDE = 3; // the number of nucleotides per codon
```
```java
/*
*
* begins with an introduction and prompts for input and output file names.
* reads the input file to process its nucleotide sequences.
* outputs the results into the given output file.
*
* @return void
*
*/
public static void main(String[] args) {
}
```
```java
/*
*
* assumes the user will type the name of an existing input file.
* input is in the proper format.
*
* @params console
* @return files array of input and output files for processing and saving
*
*/
public static String[] promptForFileNames(Scanner console) {
}
```
```java
/*
*
* Converts char nucleotide to molar mass
*
* mass percentages, use the following as the mass of each nucleotide (grams/mol).
* "junk" regions are excluded from many parts of your computations, but they do contribute mass to the total.
* Adenine (A): 135.128
* Cytosine (C): 111.103
* Guanine (G): 151.128
* Thymine (T): 125.107
* Junk (-): 100.000
*
* @params nucleotide char of nucleotide.
* @return molarMass rounded to nearest tenth.
*
*/
public static double nucleotideToMolarMass(char nucleotide) {
double[] masses = {135.128, 111.103, 151.128, 125.107};
double rounded = Math.round(mass * 10.0) / 10.0;
}
```
```java
/*
*
* Next, write code to pass over a nucleotide sequence and count the number of As, Cs, Gs, and Ts.
* use a String's charAt method to get individual characters.
*
* @params sequence sequence of
* @return counts array of size 4.
*
*/
public static int[] nucleotideCountFromSequence(String sequence) {
}
```
```java
/*
*
* converts a single character (i.e. A, C, T, G) into indices (i.e. 0 to 3).
*
* @params nucleotide char of nucleotide.
* @return index int mapping of nucleotide.
*
*/
public static int nucleotideIndexFromChar(char nucleotide) {
}
```
```java
/*
*
* eliminate these characters.
*
* @params sequence raw sequence
* @return sequence without junk DNA '-'.
*
*/
public static String nucleotidesOnlyFromSequence(String sequence) {
}
```
```java
/*
*
* break apart the sequence into codons and examine each codon.
*
* @params sequence String of nucleotides or raw.
* @return codons Array of strings of codons.
*
*/
public static String[] codonsFromSequence(String sequence) {
}
```
```java
/*
*
* Saves output to file using PrintStream as described in Section 6.4 of the textbook.
* overwrites any existing data in the output file (this is the default PrintStream behavior).
* nucleotide sequence is output in uppercase
* the nucleotide counts and mass percentages are shown in A, C, G, T order.
*
* @params path String path of output filename
* @return void;
*
*/
public static void saveOutput(String path) {
}
```

18
dna/input/dna.txt Normal file
View File

@ -0,0 +1,18 @@
cure for cancer protein
ATGCCACTATGGTAG
captain picard hair growth protein
ATgCCAACATGgATGCCcGATAtGGATTgA
bogus protein
CCATtAATgATCaCAGTt
michael jordan mad hops protein
ATgAGATCCgtgatGTGggaTCCTaCTCATTaa
paris hilton phony protein
AtgCCaacaTGGATGCCCTAAGATAtgGATTagtgA
george w bush approval rating protein
atgataattagttttaatatcagactgtaa
jimi hendrix guitar talent protein
ATGCAATTGCTCGATTAG
tyler durden's brain protein
ATGATAcctatgagtaaTGTGGACCatatccaaACTATAGGCATtgtcggACCAACGATcgattggtTATACTGA
mini me growth hormone
AtGgGaCGCTgA

40
dna/input/ecoli.txt Normal file
View File

@ -0,0 +1,40 @@
thr operon leader peptide
ATGAAACGCATTAGCaCCAcCATtACCACCaCCATCaCcATTACCACAGGTAACGGTGCGGGCTGA
aspartokinase I/homoserine dehydrogenase I
ATGCGAGtGTTGAAGTTcgGCGGTaCATCAgTGGCAAATGCAGAACGTtTTCTGCGGgTTGCCGATAttCTGGAAAGcAATGCCAGGCAGGGGCAGgTGGcCACCGTCCTCtCTGcCCCCGCCAAAATCACCAACCATCtGGTaGCGATGATtGaaAAaACCATtAGCGGTCAGGAtGCtTTaCcCaATATCAGCGATGCCGAACGTATTTTTGCCGAACTtCTGACgGGACTCGCCGCcGCCCAGcCGGGATTTCCGCTGGCACAAtTgAAAAcTTTCGTCGACCAgGAATTTGCCCAAATAAAACATGTcCtGCATGGCatCAGTTTGTTGGGGCAGTGCCCGGaTAGCATcAACGCTGCGCTGATTTGcCGTGgCGAGAAAaTGTcGaTcgCCattaTGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGgTCGAAaAAcTGCTgGCAGTGGGTCATTAcCtCgAaTCTACCGTTGATaTtGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCgGCTGACCACATgGtGCTGATGGCTGGTTTCACTGcCggTAATGAAAAAGgCGaGCTGGtGGTtCTGGGAcGCAACGGTTCCGACTaCTCCGCTGCGGTgCTGGCGGCcTGTTTaCGCGCCGATTGTTGcGAgaTCTGGACGGATGTTGAcGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGgAaGCGATGGAGCTTTCTTACTTCGGCGCTAAAgTTCTTCaCCCcCGCACCATTACCCCCATcGCCCAGtTCCAGATcCCTtgCCtGATTAAAAATAcCGgAAAtCCCCAAGCACCAGgTACGCtCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATcTGAATaACATGGCAATgTTCAGcGTTTCCGgCCCGGGGAtGAAAGGgATggTTgGCATGGCGGCGCGcgTCTTTGCAGcGaTGTCACGCGCCCGTaTTtCCGTGGTgCtGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCaAAGCGACTGTGTGCGAGCTgAaCGGGCAaTGcAGGAAGAGtTCTACCTGGAaCTGaAAGAAGGCTTACTGGAGCcGTTGGCgGtGACGGAACGGCTGGCCATTATCTcGGTGgTAGGTGATGGTATGCGcACCTtaCGTGGGAtCTCGgCGAAATtCTtTGCCGCGCTgGCcCGCGCCAATATCAACATTGTCgCCATTGCtCaGGGaTCTTcTGAaCGCTCAAtCTCTGTcGTGGTcAaTAACGATgATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGgCGTCGGTGGCGTTGgcGGTGCGCTGCTGgAGCAACTGAAGCGTCAgCAAAGCTGGTTGAAGAATAAaCATATCGaCTTACGTGTCTGCGGTGTTGCTAACTCGAAGgCACtgCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGgAAGAACTGGCGCAAGCcAAAGAGCCGTTTAATCTCGgGCGcTtAATTCGCCTCGTGAAAGAATATCATCTGCtGAaCCCGGTCATTgTTGACTgTACTTCCAgCCAGGCTGTgGCAGaTCAATATgCCGACTtCCTgCGCGAAGGTTTCCAcGTTGTtACGCCGAaCAAAaAGGCCaACACCTCGTcgATGGaTTACTaCCATCAGTtGCGTTATGCGGCGGAAAAATCGCGGCGTAaATTCCTCtATGACACcaACGTtGGGGCTGGATTACCGGTTATTgAGAACCTGCAAAATCTGCTCAATGCtGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTAtATCTTCGGCAAGTTAGACGAAGGCaTGAGTtTCTCCGAGgCGACCaCACTGGCGCGGGAAATGgGTTATACCGA
ACCGGAcCcGCGAGATGATCTTtCtGGTATGgAtGTGGCGCgTAagCTAtTGATtCTCGCTCGTGAAACGGGACGTGAACTGGAGCtGGCGGATATTGAAATTGAACCTgTGCTGCCCGCaGaGTTTAACGCCGAGGGTGATGTCGCcGCTTTTATGGCGAATCTGTCACAGCTCGACGaTCtCTTTGCCGCGCGTGTgGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATAttGATGAAGATgGCgTCTGCCGCGTGAAGaTTGCCGAAGTGGATGgTAATGaTCCGCTGTTCAAAGTGAaAaATGGCGaAAACGCCCTGGCCTTCTATAGCCACTATtATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCaATgACGTTaCAGCTGCCGGTgTCTTTGCTGATCTGCTACGtACCCTcTCAtGGaAGTTAGGAGTCTGA
homoserine kinase
ATgGTTAAAgTTTAtGCCCCGGCtTCCAGTGCCaATATGaGcGTCGgGTTTGATGTGCTCGGGgCGGCGGTGACACCTGTTGATGGTGCATTGCTCGgAGaTGTagTcaCGGTTGAGGCGGCAGAGACaTTCAgTCTCAACAACCTCGGACGCTTTGCCGAtAAGCTGCCGTCAGAGCCACGgGaaAATAtCGTTtATcAGTGcTGGGAGCGTtTTTGcCaGGAGCTTGGCAAGCAAATTCCAGTGGCGATGaCTCTGGAAAAGAATatGCCGAtCgGTTCGGGcTTAGGCTcCAGCGCCtGTTCAGTGGTCGCGGCgCTgAtGGCGATgAATGAAcACTGCGGCaAGCCGCTTAATGACACTCGTTTGCTGGCTTtGATGGgCGAgTTGGAAGGGcGTATCTCCGGCAGCAtTCATTACGACAACGtGGCACCGTGtTtTCtTGGTGGTAtGCAGTtgATGATCGAAGAaAACGACATCATCAGCCAGCAaGTGCCAGGGTTTGATGAGtGGCTGTGGGTGCTGGCGTATcCGGgGAtTAAAGTCtCGaCGGcAGAAGCCAGGGCTaTTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCAcGGGCgACATCTgGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATgAAAGaTGTTATCGCTGAACCCTACcGTGaACgGTTaCTGCCAGGCTTCCGGCAGGCGCGGcAGgCGGTTGCGGAAATCGGCGCGGTAgCGAGCGGTATCTCCGGCTCCGGCCCGAcTtTGTTCGCTCTGTGtGAcAAGCCGGATACCGCCCAGCGCGTTGCCGACTGgTTGGGTAAGAACtAcCTGCAAAATCAGgAAGGTTTTGTTcATATTTGCCGGCTGGATACGGCGGGcGCACGAgTACTGGAAAACTAA
threonine synthase
ATGAAACTCtacaATCTGAAAGATCACAATGAGCAGgTCaGCTTTGCGCAAGCCGTAACCCAGgGgTTAGGCAAAAATCAGGGgCtGTtTTTTCcgCACgaCCTGCCGGaaTTCAGCcTgACTGAAaTTGATGAGATgCTGAAGCtGGATTTTGTCACcCGCAGTGCGAAGATCCTcTCgGCGTTTATTGGTGATGAAATCCCGCAGGAAaTCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAaGCGATGTCGGTtGTCTGGAaTTGTTCcACGGGCcAACGCTGGCaTTTAAAGATTTCGGcGGTcGCTTTATGGCACAAATGCTgACCcATATTGCGGGCGATAAGCCAGTGAcCATTCTGACCGCGACATCCGGTgATACTGGaGCGGCAGTGGcTCATGcTTTCtACGGTtTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTgTTCTGTACATTGgGCggCAATATCGaAACTGTTGCCATCGAcggCGaTTTCGATGCCTGTCAGGCGCTGGTgAAGCAGGCgTTTGATGATGAAGAACTGAAAGTGgCgCtGGGGCtGAATTCTGCTAAcTCCATCAACaTCAGTCGCTTGCTGGCGcAGATTTGTTaTTAcTTTGaGGCTGTCGCACAGTtGCCGCAAGAAGCACGTAACCAGTTGgTTGTCTCGGTaCCGAGTGgAAACtTcGGCGATtTGACGGcGGGTCTGCTGGCGAaGTcACTCGGTCtGCCGGTAAAACGTtTTATTGCtgCGACCAACGTGAACGAtACCGTACCACGTTTCCTGCaCGaCGGTCAGTGGTCAcCCAAaGCGACTCAGgCGAcgTtaTCCAATGCGATGGATGTTAGCCAGCcAAaCAACTGGCCGCGTGTGGAAGAGTTGtTCcGCCGCAAAATCTGGCAACTGAAAGAGCTGGgTTATGCAGCCGTGgATGATGAAACCACGCAACAGACAATGcGTGAGtTAAaAGAACTGGGCTATACCTCGgAGCCGCACgCTGCCGTAGCTTATCGTGCGCTGCGTGACCAgTTGAAtCCAGGCGAATATGGCTTGTtCCTCGGcACcGCGCATCcGGcGAAatTtAAAgAGAGCGTGGAAGCGATTCTCGGTGAAAcGTTGGatCTGCCAAAAGAGCTGGCAGAACGTGCTgATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAatTgaTGATGAaTCATCAGTAA
hypothetical protein
AtGCAGCCcGGCTtTTTTTATGAAGAAAATaTGGAGaAaAACGACagGGAAAAAGGAGAAATTCtCAATAAATGCGGtAACTTAGAgATTaGGATTGCGGAGAATaACAACTGCcGTTCTCaTCGCGTAATCTCCGGATATCGACCCaTAACGGgCAATGATAAAAGgAGTAACCTGTGA
Non-protein region
aAAAACTgCTGGAAACAATGAAAGAcGTACCGGACGACCAAcGTCAGgCGC
transaldolase B
ATGACGGACAAATTGaCCTCcCTTCGTCAGTACACCACCGTAgTGGCCGACACTGGGGACATCGCGGCAATGAAGcTGTaTCAACcGCAGGATGCCACAACCAAcCCTtCTCTCATTCTTAACGCAGCGCAGATTCcGGAATACCGTAAgTTgATTGaTGATGCTGTCGCCTGGGcGAaACaGCAGAGCAAcGATcGCgCgCAGCAgATCGtGGACGCGACCGAcAAACTGGCAGTAaATATTgGTCTgGAAaTCCTGAAACTGgTTCCGgGCCgTATCTCAActGAAGTtGATGCGCGTCTTTCCTATGACaCCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGcAGGTaTTAGCAACGATCgTaTTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGcAGAACAGCTGGAAAAAGAaGGTATTAACTGTAAcCTGACCCTGCTgtTCTCctTCGCtCAGGcTCGTGCTTGTGCGGaAGCGGgCGTgTTCCTGaTCTCGcCGTTTgTTGGCcGTATTCTTGACTGGTAcAAaGCGAATACCGaTAAGAAAGAGtACGCTCcGGCAGAAGATcCGGGCGTGGTTTCTGTatCtGAAATCtACCAGtACTACaAAGAGCATGGTTaTgAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAAcTGGCAGGCTGCGACCGTCTGACCatCGCACCGgcACTGCTGAAAGAGCTGgCGGAGAGCGAAGGGGCTATCgAACGTAAACTgTCTTACAcTGgTGAAGTgAAAGCgCGTCCGGcGCGTATCACtGAGtCCGAGTTCCTgTGgCAgCACAACCAGGATCCAATGGCAGTaGATAAACTgGcGGaAGgTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCtGTAA
molybdopterin biosynthesis mog protein
ATGAATACTTTACGTATTGGCTTaGTtTcCaTCTCTGATCGCGCATCCAGCGGCGTTTAtCAGgaTAAAgGCATCCCTGCGCTGGAagAATGGCTGACAtcGGCGCTAACCACGcCGTTTGAaCTGGAAAcCCgCTTaATCCCCGATGAGCAGGCGATCATCGAGCAaACgTTgTGTGAGCTGGTGGATGAAaTGAGtTGCCaTCTGGTGCTCACCACGGGCGGAAcTGGCCCTGCGCGTCGTGAcgTAACGCcCGATGcGACGCTGGCAGTAGCGGACCGCGAGATgCcAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACcaaCTGCGATCCTTTCGCGTCAGGTggGGGTgATTCGCAAACAGGCGCTGATCCTTAACTTaCcCGGTCAACCGAAGtCTATTAAAGAGACGCtGgAAGGTGtGAAGGACGCTGAGgGTAAcGTTGTGGTGCACGgTATTTTTGCCaGCGTaCcGTaCTGCATTCAGTTGCTGGAAGGGCCATACGTTGAaACGGCaCCgGaAGTGGTTGCAGCATTCAGaCCGAAGAGTGCAaGACGCGAAGtTAGCGAATAA
chaperone protein DnaK
aTGGGTAAAATAaTTGGTATCGACcTGGGTACtACCAaCTCTTGTGTagCGaTTAtGGATGGCACCACTCCtCGTGtACTGgAGAACGcCGAAGGCGATCGCACCAcGcCTTcTATCATTgCCTATACCCAGGAtGGTGAAACTCTGGTTgGTCAGCCGGCTAAACGTCAGGCAgtGACGAACCCgCAaAACAcCCTGTtTGCGATTAAACGCCtGATTGGCCGCCgCTTCCAGgACgAAGAAGTACAGCGtGATgTTTcCATCATGCCGTTCAAAATTAtTGcTGCtgatAACGGCGACGcATGGGTCGAAGtTAAAgGCCAGAAAATGGCAcCGCCGcAGAtCTCTGCTGAAGTGCTGAAAAAAAtGAAGAAAACCGCTGAAGaTTAcCTGGgTGAAcCGGTAACTGaAGCTgtTATTACCGTACCGGCAtACTttaACGATGCTCAGCGTCAGGcAACCAAAGaCGCAGGCCGTATCGCTGGTCTGGAAGTAAAaCGTATCATCAACGAaCCGACCGCAGCTGCGCTGGCTtACGGtCTGGACAAAGgTACTGGCAACCgtACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTcCATTATCGAaATCGACGAAGTTGACGGCgAAAAAACCttCGAAGTTCTGGCAACCAACGGTGATACCCACCTGgGTGGtgAAGACTTCGACAGTCGTCTGATCAACTAtCTGGTTGAaGAATTCAAgAAAGATCAGGGCATTGacCtGCGCAACGaTcCGCTGGCAATGCAGCGCCTGAAaGAAGCGGCAGAAAAAGCgAAAATCGAACTGTctTCCGCTCAGcAGACCGaCGTTAACcTGCCGTACATCACTGCAGACGCGAcCGGTCCGAAACACAtGAACATCaAAgTGactCGTGCGAAACTGGAAAGCCTgGtTGAAGAtCTGGTAAACCGtTcCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATAtCGACgaCGTTATTCTCGTTGGTGGTCAGACTCGTATGCcAATGGtTCAGAAGAAAGTTGCTGaATTCTTTGGTAAAgAGCcGCGTAAAGATGTTAACCCGGACGAAGCTGTaGCCATCGgTGCTGCTGTTCAGGGTGGTGTTCTGACTGGtGAcGTAAAAGaCGTacTGCTgCtGGACGTTACCCCGCTGTCtCTGGGTATcGaAACCaTGGGCGGTGTGATGACCACGCTGATCGCgAaAAACACCACTATCCCGACCAaGcAcaGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATcCATgtGCTGcAGGGTGAACgTAaACGTGCgGCTGAtAAcaAATCTCTgggTCAGTTcAACCTGGATGGTATCAaCCCGGCACCGcGCGGCAtgCCGcAGATCGAAGtTACCtTCGAtATCGaTGCTGACGGTATCCTGCaCGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCAcTATCAaGGCTTCTTCTGGtCTGAaCGAAGAtGAAATCCAGAAAATGGTACGCGaCGCAGAAGCTAAcGCCGAAGCTGACCGTAaGTTTGAAGAGCTGGTACAGACtcGCaACCAGGGCGACCATCTGCTGCACAgCACCCGTAAGCAgGTTGAAGAAGCAGGCGACAaACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGActGCACTgGAAACtGCTCTGAAaGGTGAAGaCAAAGcCgCTATcGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCaGCAGCAACATGCcCAGCAGCAGACTGCCGGTGCTgATgCTTCtGCAAaCAAcGCGAAAGaTGACGATGTTGTCGACGCtGAATTTGAAGAAGTCAAAGACAAAAAATAA
chaperone protein DnaJ
GTGCatTCatCTAGGGGcAATTTAAAAAAGATGGCTAAGCAAGATTaTTACGAGaTTTTAGGCGTTTCCAAAaCAGCGGAAGAGCGtGAaaTCAAAAaGGCCTACAAACGCCTGGCCATGAAaTACCaCCCGGaCcGTAACCAGGgTGACAAAGaGGCCGAGGCGAAATTTAAAGAGATCAAGGaAGCTTATGAAGTTCTGACCGACtCGCAAAAACgTGCgGCATaCGATCAGTaTGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGcGGtTTTGGCGGCGGCgCAGACTTcAGCGATAtTTtTGGTGACGtTTTCGGCgATATTTTTGGcGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTAcGCTATAACATGGAGctCACcCtCGAAgAAGCTGTACGtgGCGtGaCCAAAGaGATccGCATtCCGACTCtGGAAGAGTGTGACGTTTGCCACgGTAGCgGTGCAAAACCaGGTACACAgCCgCAGACCTGTCCGACcTgTcATGGTTCTGGCCAGGtGCAGATGcGCCAGGGTTTCTTTGcCGTGCAGCAGACCTgTCcAcACTGTCAGGGCCGCGGTACGCTGaTcAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGtTGAGCgCaGCAAAACGCTGTCCGTTAAAATCCCGGCaGGGgTGGACACTGGAGaCCGCATCCGTCTTGCGgGCGAAGGTGAAGCGGGTGAACACGgCGCACCGGCAGGCGATCTgTACGTTCAGGTtCAGGTtAAACaGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGcGAAGTcCCGATCAAcTTCGCTATGgCGGCGcTGGGTGGTgaAATCGAAGTACcGACCcTTGATGGTcGcGTCaaACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAgCTGtTCCgTaTGCGCGGTAAAGGCGTCAAGTCtGTcCGCGGTGGcgCACAGGGTGATTtGCTATGCCGCGTTGTTGTCgaAACAcCGGTAGGTTTGAACgAGAAGCAGAAACAGCTGCTGCAAGaGctGCAAGAAAGCtTTGGTGGcCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCtTCTTtGATGGCGTGAaGAAGTTTTTTGACGaCCTgACTCGCTAA
hypothetical protein
TTGCTCTTaCTCGGATTCgTAAGCCGTGAAAACAGCAaCCTCCGtCTGGCCAGTTCGGATGTGAACCTCACAGAGgTCTTTTCTCGTTACCAgCGCCGCCACTACGGCGGTgATACAGATGACGATCAGgGcgACaAtcAtCgCcTTATGCTGCTTCATTGCTCtCTtCTCCTTGACCTTTCGGTCaGTAAGAgGCACTCTACATGTGTTCTGCATATAGgGGGCCTCGgGTtGATGgTAAAATAtCACTCGGGGCTTTTCTCTAtCTGCCGTTCAGCTAATgCcTGA
hypothetical protein
aTGTCTGCCAAaaGACGACTTCTTATTGCGtGTACCTTGAtAaCAGCTATcTATCAtTTTCCTGcaTATTCTTCATTAgAATATAAAGGAtCCTTTGGTTCAATaAATGCGGGTTAtGCAGACTGGAATAGTGGaTTTgTAAaCACTCACCGTGGTGAaGTATGGAAAGTGACtGCGGATTTTGGGgTaAATTTTAAAGAAGCAGAATTTTACTCAtTTTATgAaAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACgGtTTCAGCAATGaCGCATGTCAGACTCtTTGaCtCTGATaTGACATTCTTTGGCAAAATTTaTGgCCAATGGGATAACTCATgGggTGAcGATCTgGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCgAgTGGgGCTTTTtTAAACCGTATATTGGATtGCATAATCAATCTGGTGACTACGTATCAGCTAAATaTgGTCAAACGAATgGTTgGAATGGtTATGTTGTTGGCTGGACAGCAgTATTAcCATTTAcGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGaAATAGAACTGGACAGGaACGATGCTTACACGgAgCAGcAATTTGGCcGGAACGGgTTaAaTGGCGGtTTAACTATTGcCTGGAAGTTCTATCCTCGCTGGAAAGCCAGtGTGACGTGGCGTTATTTcGATAAtAaGCTGGGCTACGATGGCTTTgGcgaTCAAATGATTTAtATGCTTGgTTATGATTTCtAA
putative secreted sulfatase
ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAAtGCTTTTAGtCCTGCCTTAGCCGCAGAGGCTaAACAACcTAATTTAGTCATtaTTATGGCGGaTGATtTAGGTtaTGGCGAtTTAGcAaCaTATGGTCATCAGATCGTTAAAACACctAATATCGACAGGCtTGCCCAgGAAGGGGTCaAATTtACTGAcTaCTATGCCCCCGCTCCTTtAaGTTCAccTtCACGCGCaGGGCTATTAACCGGCcGGATGCCATTtCGTAcTGGAATTCGCTCATGGATtCCttCAGGCAAAGATGTTGCCtTAGGGCGTAACGAAcTCACgATTGCTAaTCTACTCAaAgCGCAaGGGTACGACACggCAATGATGGGTAAGCTGCATCTGAATgCAGGcGGCGaTCGCACCGATCAgCCaCAAGCACaAgATATGGGcTTTGATTAcTCAcTGGTtAATACgGCGGGCTTTGTTACcGACGCCACGCTGGATAAcGCTAAAGAACGCCcGCGTTATGGCATGGTTtAccCGACAGGCtgGCtACGTAACGGGCAACCCACTcCACGaGCTGATAAAAtGAGCGGTGAGTATGTCaGTTCGGAAGTCGTCAACTGGCTGGATAACAAAaaGGACaGCAAGCCTTTCTTCCTCTATgTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAaaATACCTCGATaTGTaCTCACaATATATGAGCGCGTATCAGAAGCAGcATCCTGATTTAtTTTaTGGCGACTGGGcAgACAAACCCTgGCGTgGTGTGGGgGAATATTAtGCCAATATCAGCTATCtGGATGCAcAGGTTGGAAAAgTGCTGGaTAAAATCAAAGCTGTGGgtGaAGaaGaTAACACAATCGTTATTTTTACCAGTGatAACGGTCCgGTAaCGCGTGAAGCGCGCAAAGTGTATgAGCTGAATTTGGCAGGGGAaACGGaTGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGtGTTCCaGCCATTATTAAATaTGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGtCTgGACTGGATGCCTACtTTaGCgAaAATGATGAACTTCAAATTACCTACAGAcCGTAcTTTCGATGgTGAATCGCTGGTTCCTGtTcTTGAGCaAAAAGCATTGAAACGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATgATCCAAcCGATGAATGGGCGATCCGTGATGgTGACTGGAAgAtGATTATCGATCGcaATAATAAACcGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAaCaCTTaAtCTGATCGGTAAAAAAACAgATATTGAAAAACAGATGTATGGTaAGtTTtTAAAATATAAAACTGATATTGATaATGATtCTCTAATGAAAgCCAGAGGTGATAAACCAGAAGCGGTGACCTggGGCTAa
putative cytoplasmic protein
ATGTTTACcAacGTAAATGTTGATTGtTgCAAAACACCAGGAtGTAAaaACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCAcAGgGTaAaAATATTTtATGCCGTGAATGTgGTTaCTTGTtTCCAGtGATATCTGAACAGTCGCTTAAtATTTaTCGTAATATTGTGAAtcACTcCTGGAGAGGTTTGATTTGCCAATGTTCAACTtGCGGAGGcACGTCCCTCAAAAAATaTGgATATtCtGCAcAagGCCAgAGAAGAATgTATTGCcaTCAtTGTGaGAAAACaTTtATCACTCTGGAAcAtGTAATTACcACACCACGAGGAGCcCTGTTAGcATTGATGATTGAGCAAGGGGAGGCACTTGCGGaTATCAgAAAGTCATTACGTCTTAACAgCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGcAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGtACCCGCGCTTtTCGcgTCAAGTAtAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGcGGCAGGGTgGTTGcCaTCTCAACCAATTACTCCCCATCtGCCGTAGagCaaCATTATcAATACaCATCGAACtATGAAGAGcGTATGTCTCCAGGGACGCTGGCACAtCATGTCCAGCGCAAAGAGttACTTACTATGCGGCgGGATACCTTGTTTGATATTGATTACGGCcCGgCAGTTTTACATCAAAACGATCCGGGAATGtTGGTAaAaCCGGTTCTTCCGGCATaTCGTCATTTTgAACTGGTCAGAATACTGACCGATGAGCATtCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATaTTGGGCGGCTGcCTGATGGCTAATTTGCAGCaTATTCATCAaGGTCGCTGCCATATTTCcTTTGTCAAaGAGCGcGGTGTGGCACCCGCCACCATTGaTTTTCCACCGCGATtATTCcTTAGTgGtGGgGTACgAAATAATGTCTGGCGTGCaTTTTCTAACCGCAATTATTCAaTGGCTGTATGCAAtCTCaCTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATtGAACAGTGCGACGCgTTtTATCCACTTTGTGgaGAACCATCCTTTCCTTATaTCATTGAACCGAATgtCTCCTGCGaaTGTCgtTTCTACaTTAGATaTCCTCAAACaTCTGTGGAATAaAaAACTAGagCATGGAACAATTtAA
sodium/proton antiporter 1
GTGAAACATCTGcATCGATTCTTTAGCaGTGATGCCTCGGGAGgCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTgcAaCCAGTGGATGGTATCACGACTTTCTTGAGACGCcGGTTCAGcTcCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGaCGCTCTGaTgGCGGTATTTTTCCTGTtGGTTGGTcTGGaAGTTAAAcGCGAGcTGaTGCAaGGTTCGCTGGCCAGTCtGCgCCAGGCGGCatTTCCTGTTATTGCCGcAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTtTtAACTATGCCGATCCGaTTaCCCGCGAAGGcTGGGCAatCCCGGCGGCGACTGacATTGCCTTTGCACTTggTgTGTTGGCGCTgTTGGGAAGTCGTGTTCCGTTAGCGCtGAAGATCTTTTtGATGGCTCTGGCtATTATCGACGATCTTgGGGcCATCATtATCATCGCATTGTTCTACAcTAATGACTTATCGATGGCCTcTCTTGGCGTcGCgGCTGTAGCAATTGCGgtACTCGCGGTATTGAAtCTGTgTGGTGTAcGCCGCACGGGCGTtTATATTCTGGTTGGCGTGGTGCtGTGGaCAGCGGTGTTGAAATCGGGGGTTCACGCAACCcTGGCTGGCGtCATtGtCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGgCGCTCTCcGgCTAAACGTCTGGAGCATGTTTTGCAtCCATGGGTGGCGTATCTGATtTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAaGGTgTCACGCtggAaGGTTTgACCtCCATTCTGCCATTAGgGATCATCGCTGGTTTGCTGaTTGGCaAGCCACtGGGTAtTaGTCTgttcTGCTGGtTGGcgCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACgACTtACCAGCAAATTATGGCGGtTGGTaTCcTGTGCGgTATCgGTTtTAcTatGTCTATCTTTATTGCCAGCCTGGcATTTGGTAgCGTAGATcCAGAaCTGaTTAACtGGGCAAAAtTAgGTATCCTTGTCGGTTCAATTTCtTcGgCGGTAATTGGATATAGcTGGTTACGcGTTCGTTTACGTCcATcAGTTTGA
transcriptional activator protein NhaR
ATGAGCATGTCTCATaTCAATTACAACCACTtGTATTACTTCTGGCaTGTCTAcAAAgAaGGTTCTGtGGTTGGCgCAGCGGAGGCGCTTTATTTAACAcCAcAAACCATTACCGGGCaGATCCGGGCGCTGGAaGAGCGCCTGCAAGGGAAAcTATTTAAGCGTAAAGGAcgTGGTCTGGAACCCAgcGAACTGGGGGAACTGGTCTATCGCtATGCCGATAAAATGTTCAcCTTAAgCCAGGAAATGCTgGATATCGTCAACTATCGCAAAGAGTCCAACTtATTGtTTGATGTTgGTGTGGCAGATGCACTTtcCAAAcGtcTGGTCAGCAGTGTTCtgGATgCCGCAGTtgTGGAAGACGAGCAGAtCCATCTACGCTGTTTCGAaTCGACGCACGAGATgCTTTTaGAGCAgtTGAGTCAGCATAaACTGGATATGATcaTCTCTGACTGTCCGaTCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAaTtGGCGAATGTGGTGTCAgtTTCTGGTgCACTAACCCACTACcAGAAAAGCCGTTTCCTGCCtGTCTTGAAgAGCgTCGtTtACTTATTCCGGGGCGTCGCTCAaTgTTGGGGCGtAAACTATTAAACTGGTTTAACTCcCAGGGCTTGAACGTCGAAATTTTGgGTGAGTTTGATGATGCTGCGTTGATGAAAgCCTTTGGGGCGAcGCATAACGcTATTTTCGTTGCACCTTCGCtTTACGCTAATgATTTCTATAACgATGACTCGgTtGTGgAGATAGgCCGTGTTGAGaACGTGATGGAAGAGTACCACGCGATTTtTGCCGaAAGgaTGAtTCAgCACCCTGcAGTAcAGCGTATCTGcAATACAgacTATTCTGCGCtgTTTACTCCAGCTTcAAAATAA
riboflavin kinase
ATGAAGCTGATACGCGgCAtACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTaATTTCGACGGCGTGCATCGCggTCATCGCGCGCTGTTACAGGGCtTGCAGGAAGAAGGGCGCAAGCGCAACtTACCGGTGATGGTGATGCTTTTtGaACCTCAACCAcTGGAACTGTTTGCTACTGAtAAAGCcCCGGCACGGcTcACcCGGCTGCgGGAAAAACTGCgTtaTcTTgCAGAgTGTGGCGTTGATTACGTGCTGTGCGtGCGTtTTGaCaGGCGTtTTGCGGCGTTAACCGCGcAAAACTTCATCAgTGATCTtCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGAtTTCCGCTTTggCGCTGgTCGTGAAgGCGAtTTCTtGTTATTACAGAaAGcgGGCATGGAATACGGCTTCGATATcACCAGCaCGCAAAcTTtTTGCGAAGGTGGTGTGCGtATCAGcAGCACCGCCGtgCGTCAGGCGCtTGCGgATgACAATCTGGCTCTGGCAGAAAGTTTACTGGgGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGaATTAGGGCGCAcTATAGGTTTCCCgACGGCGaATGTACCGcTaCgCCGTCAGGTTTCCCCGGTGAAAgGGGTTTATGCGGTAGaAgTgTTGGgCCtTGgCGAAaAGcCGTTAcCCGGcgTTGCAAACaTCGGAACACgCCCAACGGTTGCcGGTATTCGCCAGCAACTGgaAGTGCATTTGTTAGATGTTGcAATGGaCCTTTATGGTCGCCAtATACAAGTAGTGCTGCGtAAAAaAATAcGCAATGAGCAgCGATTTGcATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGcCCGCGaaTTTtTTGGGCTAAcAAAACCGGCTTAa
Isoleucyl-tRNA synthetase
ATGAGTGACTATAAATCaACCCTgAATTTGCCgGAAACAGgGTtCCCGATgCGTGGCGATCTCGcCAAGCGCGAAcCGGGaATGCTGGCGCGTTGGACTGATGATGATCTgTaCGGCATCATCCGTGCGGCTaAAAAAGGCAaAaAAACCTTCAtTCTGCATgATGGCCcTCCTTATGCGAATGGCAGCAtTCaTATTGGTcACTCGGTTAACAAGATTCTGAAAGACATTaTCATTaAgTCCAAAgGGCTttCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCaTGGtCTGCCAATCGAAcTGAAAGTAGAGCAAGAATACGGTAAGCCGGGgGAGaAaTTCACCGCCGcTGAGTtCCGCGCCAAGTGCCGCGAATACGCTGCgACCCAGGTTGACGGTCAGCGCAAAGACTTTaTCcGTCTGGGCGTGCTGGGCGActgGTCgcACCCGTACCTGACCATGGACtTCAAAACTGAAGCCAACATCATCCgCGCGCTGGGCAAAATCATCGGCAAcGGTCACCTGCACaAAGGcGCGAAGCCGGTgCACTGGTGCgTTGACTGCCGTTCTgCACTGGCAGAAGCGGAAGtTgAGTATTACGacAAAACTtCTCCGTCCATCGACGTCGCTTtCCAGGCGGTCGATCaGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATgTTAACGGCCCAATTTCGCtGGTTATCTGGaCcACCACGcCGTGgAcGCTGCcTGCTAacCGCgCAATCTCcATtGCACCTGATTTTGAttATGCGCTGGTGCaAatCgACGGTCAGgCCGTGATCCTCGCGAAAGATCtGGtTGaAAGCGTAAtGCAGCGTATCGGCGTTAGCGaTTACACCATTCTTGGCAcGGtgAAAGGTGCCGAGCtGGAACTGTTgCGCTTTACCCATCCGTTtATGGACtTCGATGTTCCGGCAaTTCTCGGCGACcACGTTACgCTGGATGCCGGTACCGGTGcCGTTCATACCGCGCCAGGCcACGGTCCGGaCGACTATgTGATCGGTcAAAAATaTGgTCTGGAAaCCGCTAACCCgGTTgGCcCGGACGgCACtTaTCTGCcGgGTACTTACCCGACTCtGGATgGCGTTaACGTCTTCAAAGCGAACGaTATTGTCATTGCGTTGTTgCAGGAAAAAGGcgCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTgCTGCtGGCGTCaTAAaACGCCGATCAtCTTCCGcgCGACGCCGCAGTGGTTCGTCAgCAtgGATCAGAAAGGTCTGCgTGCGcAGTCACTGAAAGAGATCAAAGGCgTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATcTCTCGTCaGCGTACCTGGGGcGTGCCgATGTCACTGTTCGTgCaCAaaGACACAGAAGAaCTGcATCCGCgTACTCtcGAACTGaTGGAAGAAGTGGcAAAACGCGTTgAAGTtGACgGCATTCAGGCgTGGTGGGATCTCGATGCGAAaGAgATCcTCGGCGaCGAAGCTGACCAGTATGTGAAAGTACCGGATACGCtGgATGTATGGTtTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTcCGGAATtTGCCGGTCACGCAGCGGACATGTaTcTGgAaGGTTCTGACCAACACcGTGgCTGGTtCATGTCtTCCCTGATGATCTCTACCGCGATGAAGGGcAAAGcGCCATATCGTCAGGTACTGACTCACGGCTTTAcCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGtAACaCcGTTTCGCCGCAGGATGTgATGAATAAACtGGGtGCGGATATTCTGCGTCTGTGGGTGGcATCAACCGACTAcACTGGCGAAATGGCcGtTTCTGACGAGATCcTGAAACGtGCTGCcGACAGCTATCGTCGTATCcGTAACAcCgCGCGCTTCCTGCTGGCAAACCTGAA
CgGTTtTGAtCCGGCaAAAGaTATGGTGAAACCGGAAGAGATGGTGGTaCTGGATCGCTGGGCCGtAGGTTGTGCGAAAGCGGCACAGGAAGACATCCtCAAGGCgTACGAAGCATACGATTTCcACGAAGTGGTaCAGCGTcTGaTGCGCtTCTGCTCCGTTGAGATGgGTTccTTCTACCTCGACATCATCAAAGACCGTCAgTATACcGCCAAAGCGGaCAGCGTGGCGCGTCGTAGCTGCCAGAcTgCGCTGTATCACATCGCaGAAGCGCTGGTTCGCTGGATGGCAcCAATCCTCTCCTTCaCcGCTGaTGAAGTGTGGGGtTaCCTGCCggGCGAACGTGAAAAATACGTCTTCAcCGGCgAgTGgTACGAAGGCCTGtTTGGTCTGGCAGACAGTGAAGCAATGAACGaTGCGTTCTGGGACGAGCTGTTGAAAGTGcGTGGCGAAGTGAAcAAAGTcaTTGAGCAAGCgCGTGCCGATAAGAACGTGGGcGGCTCGCTGGAAGCGGCAGTAAcCTTGTATGCAGAACCGGAaCTGGCgGCGAaaCTGaCCGcGCTGGGCGAtGAATTACGATTTGTCCTGtTGACCTCCGgCGCTAcCGTTGcAGACtATAACGACGCACCTGCTGATGCCCAGCAGaGCGAaGTcCTCAAAGGGCTGAAAgtCGCGTTGAGTAAAGCCgAAGGtGaGAAGTGTCCtcGctGCTGgCACTACACCcAGgATGTcGgCAAGGTGGCGGaACACGCAGAAATCTGCGGCCGCTGTgTcAgCaACGTCGCCGGTGACGGTGAAAAaCGTAAGTTTGCCTGA
Non-protein region
GCTTGCGCCAACGcCATTTCATCGCCATCCCGCCgAgcATACAGGCCTCGgAaGAACCAaTGGTGTTGGTGcCAACGGCCtGAccATTTTTcGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGcAGaTTGCGGATATTctTCTTTGTCGATCCAGTTTTTGTtAATGGAtAAAtCCA
FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase
ATGTCTGAATCTGTACAGaGCAaTAgCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGAtGGCaCCAcCGCTGAGTCTACCCGCAaCAaCGGTAaACCGGCGCTGTTCCGCcTGgGTgATGCTTCTCTTTCTgAaGgGCTGGAGCAACACCTGCTgGGGCTGAAAGTGGgCGATAAAACCaCCTTCtCGCTGGAGCCAGATGCGGCgTTtgGCGTGCCGTcACCgGAcCTGATtCAGTAcTTCTCcCGCCGTGAATTTATGgATGCAGGCGAGCcaGAAATTGGCGCAATCATgCTTTTTACCGCAATGGaTGGCAGTGAGATGCCTGGCGTGaTCCGCgAAATTAACGGCGACTCCATTACCGTTGATTTCAACCaTCCGCTgGCCGGGCAGACCGTTCATTTTGATATTGaagTGCTGGaAATCGATCCGGCAcTGGAGGcGTaA

63
dna/output/dna.txt Normal file
View File

@ -0,0 +1,63 @@
Region Name: cure for cancer protein
Nucleotides: ATGCCACTATGGTAG
Nuc. Counts: [4, 3, 4, 4]
Total Mass%: [27.32, 16.84, 30.55, 25.29] of 1978.76
Codons List: [ATG, CCA, CTA, TGG, TAG]
Is Protein?: YES
Region Name: captain picard hair growth protein
Nucleotides: ATGCCAACATGGATGCCCGATATGGATTGA
Nuc. Counts: [9, 6, 8, 7]
Total Mass%: [30.65, 16.8, 30.47, 22.07] of 3967.54
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, GAT, ATG, GAT, TGA]
Is Protein?: YES
Region Name: bogus protein
Nucleotides: CCATTAATGATCACAGTT
Nuc. Counts: [6, 4, 2, 6]
Total Mass%: [35.13, 19.25, 13.1, 32.52] of 2308.08
Codons List: [CCA, TTA, ATG, ATC, ACA, GTT]
Is Protein?: NO
Region Name: michael jordan mad hops protein
Nucleotides: ATGAGATCCGTGATGTGGGATCCTACTCATTAA
Nuc. Counts: [9, 6, 8, 10]
Total Mass%: [28.0, 15.35, 27.84, 28.81] of 4342.86
Codons List: [ATG, AGA, TCC, GTG, ATG, TGG, GAT, CCT, ACT, CAT, TAA]
Is Protein?: YES
Region Name: paris hilton phony protein
Nucleotides: ATGCCAACATGGATGCCCTAAGATATGGATTAGTGA
Nuc. Counts: [12, 6, 9, 9]
Total Mass%: [33.96, 13.96, 28.49, 23.58] of 4774.27
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, TAA, GAT, ATG, GAT, TAG, TGA]
Is Protein?: YES
Region Name: george w bush approval rating protein
Nucleotides: ATGATAATTAGTTTTAATATCAGACTGTAA
Nuc. Counts: [12, 2, 4, 12]
Total Mass%: [41.06, 5.63, 15.31, 38.01] of 3949.54
Codons List: [ATG, ATA, ATT, AGT, TTT, AAT, ATC, AGA, CTG, TAA]
Is Protein?: NO
Region Name: jimi hendrix guitar talent protein
Nucleotides: ATGCAATTGCTCGATTAG
Nuc. Counts: [5, 3, 4, 6]
Total Mass%: [28.58, 14.1, 25.57, 31.75] of 2364.1
Codons List: [ATG, CAA, TTG, CTC, GAT, TAG]
Is Protein?: YES
Region Name: tyler durden's brain protein
Nucleotides: ATGATACCTATGAGTAATGTGGACCATATCCAAACTATAGGCATTGTCGGACCAACGATCGATTGGTTATACTGA
Nuc. Counts: [24, 14, 16, 21]
Total Mass%: [32.95, 15.8, 24.56, 26.69] of 9843.81
Codons List: [ATG, ATA, CCT, ATG, AGT, AAT, GTG, GAC, CAT, ATC, CAA, ACT, ATA, GGC, ATT, GTC, GGA, CCA, ACG, ATC, GAT, TGG, TTA, TAC, TGA]
Is Protein?: YES
Region Name: mini me growth hormone
Nucleotides: ATGGGACGCTGA
Nuc. Counts: [3, 2, 5, 2]
Total Mass%: [24.82, 13.6, 46.26, 15.32] of 1633.44
Codons List: [ATG, GGA, CGC, TGA]
Is Protein?: NO

63
dna/output/dna_file.txt Normal file
View File

@ -0,0 +1,63 @@
Region Name: cure for cancer protein
Nucleotides: ATGCCACTATGGTAG
Nuc. Counts: [4, 3, 4, 4]
Total Mass%: [27.51, 16.96, 30.77, 25.47] of 1964.7
Codons List: [ATG, CCA, CTA, TGG, TAG]
Is Protein?: YES
Region Name: captain picard hair growth protein
Nucleotides: ATGCCAACATGGATGCCCGATATGGATTGA
Nuc. Counts: [9, 6, 8, 7]
Total Mass%: [30.76, 16.86, 30.58, 22.15] of 3953.5
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, GAT, ATG, GAT, TGA]
Is Protein?: YES
Region Name: bogus protein
Nucleotides: CCATTAATGATCACAGTT
Nuc. Counts: [6, 4, 2, 6]
Total Mass%: [35.56, 19.49, 13.26, 32.92] of 2280.1
Codons List: [CCA, TTA, ATG, ATC, ACA, GTT]
Is Protein?: NO
Region Name: michael jordan mad hops protein
Nucleotides: ATGAGATCCGTGATGTGGGATCCTACTCATTAA
Nuc. Counts: [9, 6, 8, 10]
Total Mass%: [28.37, 15.55, 28.2, 29.18] of 4286.8
Codons List: [ATG, AGA, TCC, GTG, ATG, TGG, GAT, CCT, ACT, CAT, TAA]
Is Protein?: YES
Region Name: paris hilton phony protein
Nucleotides: ATGCCAACATGGATGCCCTAAGATATGGATTAGTGA
Nuc. Counts: [12, 6, 9, 9]
Total Mass%: [34.27, 14.09, 28.74, 23.79] of 4732.2
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, TAA, GAT, ATG, GAT, TAG, TGA]
Is Protein?: YES
Region Name: george w bush approval rating protein
Nucleotides: ATGATAATTAGTTTTAATATCAGACTGTAA
Nuc. Counts: [12, 2, 4, 12]
Total Mass%: [42.57, 5.83, 15.87, 39.41] of 3809.4
Codons List: [ATG, ATA, ATT, AGT, TTT, AAT, ATC, AGA, CTG, TAA]
Is Protein?: NO
Region Name: jimi hendrix guitar talent protein
Nucleotides: ATGCAATTGCTCGATTAG
Nuc. Counts: [5, 3, 4, 6]
Total Mass%: [29.1, 14.35, 26.03, 32.33] of 2322.0
Codons List: [ATG, CAA, TTG, CTC, GAT, TAG]
Is Protein?: YES
Region Name: tyler durden's brain protein
Nucleotides: ATGATACCTATGAGTAATGTGGACCATATCCAAACTATAGGCATTGTCGGACCAACGATCGATTGGTTATACTGA
Nuc. Counts: [24, 14, 16, 21]
Total Mass%: [33.28, 15.96, 24.81, 26.96] of 9745.8
Codons List: [ATG, ATA, CCT, ATG, AGT, AAT, GTG, GAC, CAT, ATC, CAA, ACT, ATA, GGC, ATT, GTC, GGA, CCA, ACG, ATC, GAT, TGG, TTA, TAC, TGA]
Is Protein?: YES
Region Name: mini me growth hormone
Nucleotides: ATGGGACGCTGA
Nuc. Counts: [3, 2, 5, 2]
Total Mass%: [24.82, 13.6, 46.26, 15.32] of 1633.4
Codons List: [ATG, GGA, CGC, TGA]
Is Protein?: NO

140
dna/output/ecoli.txt Normal file
View File

@ -0,0 +1,140 @@
Region Name: thr operon leader peptide
Nucleotides: ATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGA
Nuc. Counts: [21, 22, 12, 11]
Total Mass%: [32.9, 28.34, 21.02, 15.95] of 8625.7
Codons List: [ATG, AAA, CGC, ATT, AGC, ACC, ACC, ATT, ACC, ACC, ACC, ATC, ACC, ATT, ACC, ACA, GGT, AAC, GGT, GCG, GGC, TGA]
Is Protein?: YES
Region Name: aspartokinase I/homoserine dehydrogenase I
Nucleotides: ATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGGGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCATCTGGTAGCGATGATTGAAAAAACCATTAGCGGTCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTCTGACGGGACTCGCCGCCGCCCAGCCGGGATTTCCGCTGGCACAATTGAAAACTTTCGTCGACCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATCAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCATTATGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGGTCGAAAAACTGCTGGCAGTGGGTCATTACCTCGAATCTACCGTTGATATTGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCGGCTGACCACATGGTGCTGATGGCTGGTTTCACTGCCGGTAATGAAAAAGGCGAGCTGGTGGTTCTGGGACGCAACGGTTCCGACTACTCCGCTGCGGTGCTGGCGGCCTGTTTACGCGCCGATTGTTGCGAGATCTGGACGGATGTTGACGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGGAAGCGATGGAGCTTTCTTACTTCGGCGCTAAAGTTCTTCACCCCCGCACCATTACCCCCATCGCCCAGTTCCAGATCCCTTGCCTGATTAAAAATACCGGAAATCCCCAAGCACCAGGTACGCTCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATCTGAATAACATGGCAATGTTCAGCGTTTCCGGCCCGGGGATGAAAGGGATGGTTGGCATGGCGGCGCGCGTCTTTGCAGCGATGTCACGCGCCCGTATTTCCGTGGTGCTGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCAAAGCGACTGTGTGCGAGCTGAACGGGCAATGCAGGAAGAGTTCTACCTGGAACTGAAAGAAGGCTTACTGGAGCCGTTGGCGGTGACGGAACGGCTGGCCATTATCTCGGTGGTAGGTGATGGTATGCGCACCTTACGTGGGATCTCGGCGAAATTCTTTGCCGCGCTGGCCCGCGCCAATATCAACATTGTCGCCATTGCTCAGGGATCTTCTGAACGCTCAATCTCTGTCGTGGTCAATAACGATGATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGGCGTCGGTGGCGTTGGCGGTGCGCTGCTGGAGCAACTGAAGCGTCAGCAAAGCTGGTTGAAGAATAAACATATCGACTTACGTGTCTGCGGTGTTGCTAACTCGAAGGCACTGCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGGAAGAACTGGCGCAAGCCAAAGAGCCGTTTAATCTCGGGCGCTTAATTCGCCTCGTGAAAGAATATCATCTGCTGAACCCGGTCATTGTTGACTGTACTTCCAGCCAGGCTGTGGCAGATCAATATGCCGACTTCCTGCGCGAAGGTTTCCACGTTGTTACGCCGAACAAAAAGGCCAACACCTCGTCGATGGATTACTACCATCAGTTGCGTTATGCGGCGGAAAAATCGCGGCGTAAATTCCTCTATGACACCAACGTTGGGGCTGGATTACCGGTTATTGAGAACCTGCAAAATCTGCTCAATGCTGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTATATCTTCGGCAAGTTAGACGAAGGCATGAGTTTCTCCGAGGCGACCACACTGGCGCGGGAAA
TGGGTTATACCGAACCGGACCCGCGAGATGATCTTTCTGGTATGGATGTGGCGCGTAAGCTATTGATTCTCGCTCGTGAAACGGGACGTGAACTGGAGCTGGCGGATATTGAAATTGAACCTGTGCTGCCCGCAGAGTTTAACGCCGAGGGTGATGTCGCCGCTTTTATGGCGAATCTGTCACAGCTCGACGATCTCTTTGCCGCGCGTGTGGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATATTGATGAAGATGGCGTCTGCCGCGTGAAGATTGCCGAAGTGGATGGTAATGATCCGCTGTTCAAAGTGAAAAATGGCGAAAACGCCCTGGCCTTCTATAGCCACTATTATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCAATGACGTTACAGCTGCCGGTGTCTTTGCTGATCTGCTACGTACCCTCTCATGGAAGTTAGGAGTCTGA
Nuc. Counts: [551, 608, 692, 612]
Total Mass%: [23.04, 20.91, 32.37, 23.7] of 323096.2
Codons List: [ATG, CGA, GTG, TTG, AAG, TTC, GGC, GGT, ACA, TCA, GTG, GCA, AAT, GCA, GAA, CGT, TTT, CTG, CGG, GTT, GCC, GAT, ATT, CTG, GAA, AGC, AAT, GCC, AGG, CAG, GGG, CAG, GTG, GCC, ACC, GTC, CTC, TCT, GCC, CCC, GCC, AAA, ATC, ACC, AAC, CAT, CTG, GTA, GCG, ATG, ATT, GAA, AAA, ACC, ATT, AGC, GGT, CAG, GAT, GCT, TTA, CCC, AAT, ATC, AGC, GAT, GCC, GAA, CGT, ATT, TTT, GCC, GAA, CTT, CTG, ACG, GGA, CTC, GCC, GCC, GCC, CAG, CCG, GGA, TTT, CCG, CTG, GCA, CAA, TTG, AAA, ACT, TTC, GTC, GAC, CAG, GAA, TTT, GCC, CAA, ATA, AAA, CAT, GTC, CTG, CAT, GGC, ATC, AGT, TTG, TTG, GGG, CAG, TGC, CCG, GAT, AGC, ATC, AAC, GCT, GCG, CTG, ATT, TGC, CGT, GGC, GAG, AAA, ATG, TCG, ATC, GCC, ATT, ATG, GCC, GGC, GTG, TTA, GAA, GCG, CGT, GGT, CAC, AAC, GTT, ACC, GTT, ATC, GAT, CCG, GTC, GAA, AAA, CTG, CTG, GCA, GTG, GGT, CAT, TAC, CTC, GAA, TCT, ACC, GTT, GAT, ATT, GCT, GAA, TCC, ACC, CGC, CGT, ATT, GCG, GCA, AGC, CGC, ATT, CCG, GCT, GAC, CAC, ATG, GTG, CTG, ATG, GCT, GGT, TTC, ACT, GCC, GGT, AAT, GAA, AAA, GGC, GAG, CTG, GTG, GTT, CTG, GGA, CGC, AAC, GGT, TCC, GAC, TAC, TCC, GCT, GCG, GTG, CTG, GCG, GCC, TGT, TTA, CGC, GCC, GAT, TGT, TGC, GAG, ATC, TGG, ACG, GAT, GTT, GAC, GGT, GTT, TAT, ACC, TGC, GAT, CCG, CGT, CAG, GTG, CCC, GAT, GCG, AGG, TTG, TTG, AAG, TCG, ATG, TCC, TAT, CAG, GAA, GCG, ATG, GAG, CTT, TCT, TAC, TTC, GGC, GCT, AAA, GTT, CTT, CAC, CCC, CGC, ACC, ATT, ACC, CCC, ATC, GCC, CAG, TTC, CAG, ATC, CCT, TGC, CTG, ATT, AAA, AAT, ACC, GGA, AAT, CCC, CAA, GCA, CCA, GGT, ACG, CTC, ATT, GGT, GCC, AGC, CGT, GAT, GAA, GAC, GAA, TTA, CCG, GTC, AAG, GGC, ATT, TCC, AAT, CTG, AAT, AAC, ATG, GCA, ATG, TTC, AGC, GTT, TCC, GGC, CCG, GGG, ATG, AAA, GGG, ATG, GTT, GGC, ATG, GCG, GCG, CGC, GTC, TTT, GCA, GCG, ATG, TCA, CGC, GCC, CGT, ATT, TCC, GTG, GTG, CTG, ATT, ACG, CAA, TCA, TCT, TCC, GAA, TAC, AGT, ATC, AGT, TTC, TGC, GTT, CCG, CAA, AGC, GAC, TGT, GTG, CGA, GCT, GAA, CGG, GCA, ATG, CAG, GAA, GAG, TTC, TAC, CTG, GAA, CTG, AAA, GAA, GGC, TTA, CTG, GAG, CCG, TTG, GCG, GTG, ACG, GAA, CGG, CTG, GCC, 
ATT, ATC, TCG, GTG, GTA, GGT, GAT, GGT, ATG, CGC, ACC, TTA, CGT, GGG, ATC, TCG, GCG, AAA, TTC, TTT, GCC, GCG, CTG, GCC, CGC, GCC, AAT, ATC, AAC, ATT, GTC, GCC, ATT, GCT, CAG, GGA, TCT, TCT, GAA, CGC, TCA, ATC, TCT, GTC, GTG, GTC, AAT, AAC, GAT, GAT, GCG, ACC, ACT, GGC, GTG, CGC, GTT, ACT, CAT, CAG, ATG, CTG, TTC, AAT, ACC, GAT, CAG, GTT, ATC, GAA, GTG, TTT, GTG, ATT, GGC, GTC, GGT, GGC, GTT, GGC, GGT, GCG, CTG, CTG, GAG, CAA, CTG, AAG, CGT, CAG, CAA, AGC, TGG, TTG, AAG, AAT, AAA, CAT, ATC, GAC, TTA, CGT, GTC, TGC, GGT, GTT, GCT, AAC, TCG, AAG, GCA, CTG, CTC, ACC, AAT, GTA, CAT, GGC, CTT, AAT, CTG, GAA, AAC, TGG, CAG, GAA, GAA, CTG, GCG, CAA, GCC, AAA, GAG, CCG, TTT, AAT, CTC, GGG, CGC, TTA, ATT, CGC, CTC, GTG, AAA, GAA, TAT, CAT, CTG, CTG, AAC, CCG, GTC, ATT, GTT, GAC, TGT, ACT, TCC, AGC, CAG, GCT, GTG, GCA, GAT, CAA, TAT, GCC, GAC, TTC, CTG, CGC, GAA, GGT, TTC, CAC, GTT, GTT, ACG, CCG, AAC, AAA, AAG, GCC, AAC, ACC, TCG, TCG, ATG, GAT, TAC, TAC, CAT, CAG, TTG, CGT, TAT, GCG, GCG, GAA, AAA, TCG, CGG, CGT, AAA, TTC, CTC, TAT, GAC, ACC, AAC, GTT, GGG, GCT, GGA, TTA, CCG, GTT, ATT, GAG, AAC, CTG, CAA, AAT, CTG, CTC, AAT, GCT, GGT, GAT, GAA, TTG, ATG, AAG, TTC, TCC, GGC, ATT, CTT, TCA, GGT, TCG, CTT, TCT, TAT, ATC, TTC, GGC, AAG, TTA, GAC, GAA, GGC, ATG, AGT, TTC, TCC, GAG, GCG, ACC, ACA, CTG, GCG, CGG, GAA, ATG, GGT, TAT, ACC, GAA, CCG, GAC, CCG, CGA, GAT, GAT, CTT, TCT, GGT, ATG, GAT, GTG, GCG, CGT, AAG, CTA, TTG, ATT, CTC, GCT, CGT, GAA, ACG, GGA, CGT, GAA, CTG, GAG, CTG, GCG, GAT, ATT, GAA, ATT, GAA, CCT, GTG, CTG, CCC, GCA, GAG, TTT, AAC, GCC, GAG, GGT, GAT, GTC, GCC, GCT, TTT, ATG, GCG, AAT, CTG, TCA, CAG, CTC, GAC, GAT, CTC, TTT, GCC, GCG, CGT, GTG, GCG, AAG, GCC, CGT, GAT, GAA, GGA, AAA, GTT, TTG, CGC, TAT, GTT, GGC, AAT, ATT, GAT, GAA, GAT, GGC, GTC, TGC, CGC, GTG, AAG, ATT, GCC, GAA, GTG, GAT, GGT, AAT, GAT, CCG, CTG, TTC, AAA, GTG, AAA, AAT, GGC, GAA, AAC, GCC, CTG, GCC, TTC, TAT, AGC, CAC, TAT, TAT, CAG, CCG, CTG, CCG, TTG, GTA, CTG, CGC, GGA, TAT, GGT, GCG, 
GGC, AAT, GAC, GTT, ACA, GCT, GCC, GGT, GTC, TTT, GCT, GAT, CTG, CTA, CGT, ACC, CTC, TCA, TGG, AAG, TTA, GGA, GTC, TGA]
Is Protein?: YES
Region Name: homoserine kinase
Nucleotides: ATGGTTAAAGTTTATGCCCCGGCTTCCAGTGCCAATATGAGCGTCGGGTTTGATGTGCTCGGGGCGGCGGTGACACCTGTTGATGGTGCATTGCTCGGAGATGTAGTCACGGTTGAGGCGGCAGAGACATTCAGTCTCAACAACCTCGGACGCTTTGCCGATAAGCTGCCGTCAGAGCCACGGGAAAATATCGTTTATCAGTGCTGGGAGCGTTTTTGCCAGGAGCTTGGCAAGCAAATTCCAGTGGCGATGACTCTGGAAAAGAATATGCCGATCGGTTCGGGCTTAGGCTCCAGCGCCTGTTCAGTGGTCGCGGCGCTGATGGCGATGAATGAACACTGCGGCAAGCCGCTTAATGACACTCGTTTGCTGGCTTTGATGGGCGAGTTGGAAGGGCGTATCTCCGGCAGCATTCATTACGACAACGTGGCACCGTGTTTTCTTGGTGGTATGCAGTTGATGATCGAAGAAAACGACATCATCAGCCAGCAAGTGCCAGGGTTTGATGAGTGGCTGTGGGTGCTGGCGTATCCGGGGATTAAAGTCTCGACGGCAGAAGCCAGGGCTATTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCACGGGCGACATCTGGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATGAAAGATGTTATCGCTGAACCCTACCGTGAACGGTTACTGCCAGGCTTCCGGCAGGCGCGGCAGGCGGTTGCGGAAATCGGCGCGGTAGCGAGCGGTATCTCCGGCTCCGGCCCGACTTTGTTCGCTCTGTGTGACAAGCCGGATACCGCCCAGCGCGTTGCCGACTGGTTGGGTAAGAACTACCTGCAAAATCAGGAAGGTTTTGTTCATATTTGCCGGCTGGATACGGCGGGCGCACGAGTACTGGAAAACTAA
Nuc. Counts: [193, 226, 295, 219]
Total Mass%: [21.16, 20.37, 36.17, 22.23] of 123268.3
Codons List: [ATG, GTT, AAA, GTT, TAT, GCC, CCG, GCT, TCC, AGT, GCC, AAT, ATG, AGC, GTC, GGG, TTT, GAT, GTG, CTC, GGG, GCG, GCG, GTG, ACA, CCT, GTT, GAT, GGT, GCA, TTG, CTC, GGA, GAT, GTA, GTC, ACG, GTT, GAG, GCG, GCA, GAG, ACA, TTC, AGT, CTC, AAC, AAC, CTC, GGA, CGC, TTT, GCC, GAT, AAG, CTG, CCG, TCA, GAG, CCA, CGG, GAA, AAT, ATC, GTT, TAT, CAG, TGC, TGG, GAG, CGT, TTT, TGC, CAG, GAG, CTT, GGC, AAG, CAA, ATT, CCA, GTG, GCG, ATG, ACT, CTG, GAA, AAG, AAT, ATG, CCG, ATC, GGT, TCG, GGC, TTA, GGC, TCC, AGC, GCC, TGT, TCA, GTG, GTC, GCG, GCG, CTG, ATG, GCG, ATG, AAT, GAA, CAC, TGC, GGC, AAG, CCG, CTT, AAT, GAC, ACT, CGT, TTG, CTG, GCT, TTG, ATG, GGC, GAG, TTG, GAA, GGG, CGT, ATC, TCC, GGC, AGC, ATT, CAT, TAC, GAC, AAC, GTG, GCA, CCG, TGT, TTT, CTT, GGT, GGT, ATG, CAG, TTG, ATG, ATC, GAA, GAA, AAC, GAC, ATC, ATC, AGC, CAG, CAA, GTG, CCA, GGG, TTT, GAT, GAG, TGG, CTG, TGG, GTG, CTG, GCG, TAT, CCG, GGG, ATT, AAA, GTC, TCG, ACG, GCA, GAA, GCC, AGG, GCT, ATT, TTA, CCG, GCG, CAG, TAT, CGC, CGC, CAG, GAT, TGC, ATT, GCG, CAC, GGG, CGA, CAT, CTG, GCA, GGC, TTC, ATT, CAC, GCC, TGC, TAT, TCC, CGT, CAG, CTT, GAG, CTT, GCC, GCG, AAG, CTG, ATG, AAA, GAT, GTT, ATC, GCT, GAA, CCC, TAC, CGT, GAA, CGG, TTA, CTG, CCA, GGC, TTC, CGG, CAG, GCG, CGG, CAG, GCG, GTT, GCG, GAA, ATC, GGC, GCG, GTA, GCG, AGC, GGT, ATC, TCC, GGC, TCC, GGC, CCG, ACT, TTG, TTC, GCT, CTG, TGT, GAC, AAG, CCG, GAT, ACC, GCC, CAG, CGC, GTT, GCC, GAC, TGG, TTG, GGT, AAG, AAC, TAC, CTG, CAA, AAT, CAG, GAA, GGT, TTT, GTT, CAT, ATT, TGC, CGG, CTG, GAT, ACG, GCG, GGC, GCA, CGA, GTA, CTG, GAA, AAC, TAA]
Is Protein?: YES
Region Name: threonine synthase
Nucleotides: ATGAAACTCTACAATCTGAAAGATCACAATGAGCAGGTCAGCTTTGCGCAAGCCGTAACCCAGGGGTTAGGCAAAAATCAGGGGCTGTTTTTTCCGCACGACCTGCCGGAATTCAGCCTGACTGAAATTGATGAGATGCTGAAGCTGGATTTTGTCACCCGCAGTGCGAAGATCCTCTCGGCGTTTATTGGTGATGAAATCCCGCAGGAAATCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAAGCGATGTCGGTTGTCTGGAATTGTTCCACGGGCCAACGCTGGCATTTAAAGATTTCGGCGGTCGCTTTATGGCACAAATGCTGACCCATATTGCGGGCGATAAGCCAGTGACCATTCTGACCGCGACATCCGGTGATACTGGAGCGGCAGTGGCTCATGCTTTCTACGGTTTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTGTTCTGTACATTGGGCGGCAATATCGAAACTGTTGCCATCGACGGCGATTTCGATGCCTGTCAGGCGCTGGTGAAGCAGGCGTTTGATGATGAAGAACTGAAAGTGGCGCTGGGGCTGAATTCTGCTAACTCCATCAACATCAGTCGCTTGCTGGCGCAGATTTGTTATTACTTTGAGGCTGTCGCACAGTTGCCGCAAGAAGCACGTAACCAGTTGGTTGTCTCGGTACCGAGTGGAAACTTCGGCGATTTGACGGCGGGTCTGCTGGCGAAGTCACTCGGTCTGCCGGTAAAACGTTTTATTGCTGCGACCAACGTGAACGATACCGTACCACGTTTCCTGCACGACGGTCAGTGGTCACCCAAAGCGACTCAGGCGACGTTATCCAATGCGATGGATGTTAGCCAGCCAAACAACTGGCCGCGTGTGGAAGAGTTGTTCCGCCGCAAAATCTGGCAACTGAAAGAGCTGGGTTATGCAGCCGTGGATGATGAAACCACGCAACAGACAATGCGTGAGTTAAAAGAACTGGGCTATACCTCGGAGCCGCACGCTGCCGTAGCTTATCGTGCGCTGCGTGACCAGTTGAATCCAGGCGAATATGGCTTGTTCCTCGGCACCGCGCATCCGGCGAAATTTAAAGAGAGCGTGGAAGCGATTCTCGGTGAAACGTTGGATCTGCCAAAAGAGCTGGCAGAACGTGCTGATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAATTGATGATGAATCATCAGTAA
Nuc. Counts: [309, 311, 358, 309]
Total Mass%: [24.69, 20.43, 32.0, 22.86] of 169097.5
Codons List: [ATG, AAA, CTC, TAC, AAT, CTG, AAA, GAT, CAC, AAT, GAG, CAG, GTC, AGC, TTT, GCG, CAA, GCC, GTA, ACC, CAG, GGG, TTA, GGC, AAA, AAT, CAG, GGG, CTG, TTT, TTT, CCG, CAC, GAC, CTG, CCG, GAA, TTC, AGC, CTG, ACT, GAA, ATT, GAT, GAG, ATG, CTG, AAG, CTG, GAT, TTT, GTC, ACC, CGC, AGT, GCG, AAG, ATC, CTC, TCG, GCG, TTT, ATT, GGT, GAT, GAA, ATC, CCG, CAG, GAA, ATC, CTG, GAA, GAG, CGC, GTA, CGT, GCG, GCG, TTT, GCC, TTC, CCG, GCT, CCG, GTC, GCC, AAT, GTT, GAA, AGC, GAT, GTC, GGT, TGT, CTG, GAA, TTG, TTC, CAC, GGG, CCA, ACG, CTG, GCA, TTT, AAA, GAT, TTC, GGC, GGT, CGC, TTT, ATG, GCA, CAA, ATG, CTG, ACC, CAT, ATT, GCG, GGC, GAT, AAG, CCA, GTG, ACC, ATT, CTG, ACC, GCG, ACA, TCC, GGT, GAT, ACT, GGA, GCG, GCA, GTG, GCT, CAT, GCT, TTC, TAC, GGT, TTA, CCG, AAT, GTG, AAA, GTG, GTT, ATC, CTC, TAT, CCA, CGA, GGC, AAA, ATC, AGT, CCA, CTG, CAA, GAA, AAA, CTG, TTC, TGT, ACA, TTG, GGC, GGC, AAT, ATC, GAA, ACT, GTT, GCC, ATC, GAC, GGC, GAT, TTC, GAT, GCC, TGT, CAG, GCG, CTG, GTG, AAG, CAG, GCG, TTT, GAT, GAT, GAA, GAA, CTG, AAA, GTG, GCG, CTG, GGG, CTG, AAT, TCT, GCT, AAC, TCC, ATC, AAC, ATC, AGT, CGC, TTG, CTG, GCG, CAG, ATT, TGT, TAT, TAC, TTT, GAG, GCT, GTC, GCA, CAG, TTG, CCG, CAA, GAA, GCA, CGT, AAC, CAG, TTG, GTT, GTC, TCG, GTA, CCG, AGT, GGA, AAC, TTC, GGC, GAT, TTG, ACG, GCG, GGT, CTG, CTG, GCG, AAG, TCA, CTC, GGT, CTG, CCG, GTA, AAA, CGT, TTT, ATT, GCT, GCG, ACC, AAC, GTG, AAC, GAT, ACC, GTA, CCA, CGT, TTC, CTG, CAC, GAC, GGT, CAG, TGG, TCA, CCC, AAA, GCG, ACT, CAG, GCG, ACG, TTA, TCC, AAT, GCG, ATG, GAT, GTT, AGC, CAG, CCA, AAC, AAC, TGG, CCG, CGT, GTG, GAA, GAG, TTG, TTC, CGC, CGC, AAA, ATC, TGG, CAA, CTG, AAA, GAG, CTG, GGT, TAT, GCA, GCC, GTG, GAT, GAT, GAA, ACC, ACG, CAA, CAG, ACA, ATG, CGT, GAG, TTA, AAA, GAA, CTG, GGC, TAT, ACC, TCG, GAG, CCG, CAC, GCT, GCC, GTA, GCT, TAT, CGT, GCG, CTG, CGT, GAC, CAG, TTG, AAT, CCA, GGC, GAA, TAT, GGC, TTG, TTC, CTC, GGC, ACC, GCG, CAT, CCG, GCG, AAA, TTT, AAA, GAG, AGC, GTG, GAA, GCG, ATT, CTC, GGT, GAA, ACG, TTG, GAT, CTG, CCA, 
AAA, GAG, CTG, GCA, GAA, CGT, GCT, GAT, TTA, CCC, TTG, CTT, TCG, CAT, AAC, CTG, CCC, GCC, GAT, TTT, GCT, GCG, TTG, CGT, AAA, TTG, ATG, ATG, AAT, CAT, CAG, TAA]
Is Protein?: YES
Region Name: hypothetical protein
Nucleotides: ATGCAGCCCGGCTTTTTTTATGAAGAAAATATGGAGAAAAACGACAGGGAAAAAGGAGAAATTCTCAATAAATGCGGTAACTTAGAGATTAGGATTGCGGAGAATAACAACTGCCGTTCTCATCGCGTAATCTCCGGATATCGACCCATAACGGGCAATGATAAAAGGAGTAACCTGTGA
Nuc. Counts: [66, 31, 43, 40]
Total Mass%: [37.57, 14.51, 27.37, 21.08] of 23739.3
Codons List: [ATG, CAG, CCC, GGC, TTT, TTT, TAT, GAA, GAA, AAT, ATG, GAG, AAA, AAC, GAC, AGG, GAA, AAA, GGA, GAA, ATT, CTC, AAT, AAA, TGC, GGT, AAC, TTA, GAG, ATT, AGG, ATT, GCG, GAG, AAT, AAC, AAC, TGC, CGT, TCT, CAT, CGC, GTA, ATC, TCC, GGA, TAT, CGA, CCC, ATA, ACG, GGC, AAT, GAT, AAA, AGG, AGT, AAC, CTG, TGA]
Is Protein?: YES
Region Name: Non-protein region
Nucleotides: AAAAACTGCTGGAAACAATGAAAGACGTACCGGACGACCAACGTCAGGCGC
Nuc. Counts: [20, 13, 13, 5]
Total Mass%: [39.46, 21.09, 28.68, 9.13] of 6849.2
Codons List: [AAA, AAC, TGC, TGG, AAA, CAA, TGA, AAG, ACG, TAC, CGG, ACG, ACC, AAC, GTC, AGG, CGC]
Is Protein?: NO
Region Name: transaldolase B
Nucleotides: ATGACGGACAAATTGACCTCCCTTCGTCAGTACACCACCGTAGTGGCCGACACTGGGGACATCGCGGCAATGAAGCTGTATCAACCGCAGGATGCCACAACCAACCCTTCTCTCATTCTTAACGCAGCGCAGATTCCGGAATACCGTAAGTTGATTGATGATGCTGTCGCCTGGGCGAAACAGCAGAGCAACGATCGCGCGCAGCAGATCGTGGACGCGACCGACAAACTGGCAGTAAATATTGGTCTGGAAATCCTGAAACTGGTTCCGGGCCGTATCTCAACTGAAGTTGATGCGCGTCTTTCCTATGACACCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGCAGGTATTAGCAACGATCGTATTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGCAGAACAGCTGGAAAAAGAAGGTATTAACTGTAACCTGACCCTGCTGTTCTCCTTCGCTCAGGCTCGTGCTTGTGCGGAAGCGGGCGTGTTCCTGATCTCGCCGTTTGTTGGCCGTATTCTTGACTGGTACAAAGCGAATACCGATAAGAAAGAGTACGCTCCGGCAGAAGATCCGGGCGTGGTTTCTGTATCTGAAATCTACCAGTACTACAAAGAGCATGGTTATGAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAACTGGCAGGCTGCGACCGTCTGACCATCGCACCGGCACTGCTGAAAGAGCTGGCGGAGAGCGAAGGGGCTATCGAACGTAAACTGTCTTACACTGGTGAAGTGAAAGCGCGTCCGGCGCGTATCACTGAGTCCGAGTTCCTGTGGCAGCACAACCAGGATCCAATGGCAGTAGATAAACTGGCGGAAGGTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCTGTAA
Nuc. Counts: [252, 236, 256, 210]
Total Mass%: [27.11, 20.88, 30.8, 20.92] of 125598.0
Codons List: [ATG, ACG, GAC, AAA, TTG, ACC, TCC, CTT, CGT, CAG, TAC, ACC, ACC, GTA, GTG, GCC, GAC, ACT, GGG, GAC, ATC, GCG, GCA, ATG, AAG, CTG, TAT, CAA, CCG, CAG, GAT, GCC, ACA, ACC, AAC, CCT, TCT, CTC, ATT, CTT, AAC, GCA, GCG, CAG, ATT, CCG, GAA, TAC, CGT, AAG, TTG, ATT, GAT, GAT, GCT, GTC, GCC, TGG, GCG, AAA, CAG, CAG, AGC, AAC, GAT, CGC, GCG, CAG, CAG, ATC, GTG, GAC, GCG, ACC, GAC, AAA, CTG, GCA, GTA, AAT, ATT, GGT, CTG, GAA, ATC, CTG, AAA, CTG, GTT, CCG, GGC, CGT, ATC, TCA, ACT, GAA, GTT, GAT, GCG, CGT, CTT, TCC, TAT, GAC, ACC, GAA, GCG, TCA, ATT, GCG, AAA, GCA, AAA, CGC, CTG, ATC, AAA, CTC, TAC, AAC, GAT, GCA, GGT, ATT, AGC, AAC, GAT, CGT, ATT, CTG, ATC, AAA, CTG, GCT, TCT, ACC, TGG, CAG, GGT, ATC, CGT, GCT, GCA, GAA, CAG, CTG, GAA, AAA, GAA, GGT, ATT, AAC, TGT, AAC, CTG, ACC, CTG, CTG, TTC, TCC, TTC, GCT, CAG, GCT, CGT, GCT, TGT, GCG, GAA, GCG, GGC, GTG, TTC, CTG, ATC, TCG, CCG, TTT, GTT, GGC, CGT, ATT, CTT, GAC, TGG, TAC, AAA, GCG, AAT, ACC, GAT, AAG, AAA, GAG, TAC, GCT, CCG, GCA, GAA, GAT, CCG, GGC, GTG, GTT, TCT, GTA, TCT, GAA, ATC, TAC, CAG, TAC, TAC, AAA, GAG, CAT, GGT, TAT, GAA, ACC, GTG, GTT, ATG, GGC, GCA, AGC, TTC, CGT, AAC, ATC, GGC, GAA, ATT, CTG, GAA, CTG, GCA, GGC, TGC, GAC, CGT, CTG, ACC, ATC, GCA, CCG, GCA, CTG, CTG, AAA, GAG, CTG, GCG, GAG, AGC, GAA, GGG, GCT, ATC, GAA, CGT, AAA, CTG, TCT, TAC, ACT, GGT, GAA, GTG, AAA, GCG, CGT, CCG, GCG, CGT, ATC, ACT, GAG, TCC, GAG, TTC, CTG, TGG, CAG, CAC, AAC, CAG, GAT, CCA, ATG, GCA, GTA, GAT, AAA, CTG, GCG, GAA, GGT, ATC, CGT, AAG, TTT, GCT, GTT, GAC, CAG, GAA, AAA, CTG, GAA, AAA, ATG, ATC, GGC, GAT, CTG, CTG, TAA]
Is Protein?: YES
Region Name: molybdopterin biosynthesis mog protein
Nucleotides: ATGAATACTTTACGTATTGGCTTAGTTTCCATCTCTGATCGCGCATCCAGCGGCGTTTATCAGGATAAAGGCATCCCTGCGCTGGAAGAATGGCTGACATCGGCGCTAACCACGCCGTTTGAACTGGAAACCCGCTTAATCCCCGATGAGCAGGCGATCATCGAGCAAACGTTGTGTGAGCTGGTGGATGAAATGAGTTGCCATCTGGTGCTCACCACGGGCGGAACTGGCCCTGCGCGTCGTGACGTAACGCCCGATGCGACGCTGGCAGTAGCGGACCGCGAGATGCCAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACCAACTGCGATCCTTTCGCGTCAGGTGGGGGTGATTCGCAAACAGGCGCTGATCCTTAACTTACCCGGTCAACCGAAGTCTATTAAAGAGACGCTGGAAGGTGTGAAGGACGCTGAGGGTAACGTTGTGGTGCACGGTATTTTTGCCAGCGTACCGTACTGCATTCAGTTGCTGGAAGGGCCATACGTTGAAACGGCACCGGAAGTGGTTGCAGCATTCAGACCGAAGAGTGCAAGACGCGAAGTTAGCGAATAA
Nuc. Counts: [139, 143, 175, 131]
Total Mass%: [24.18, 20.45, 34.05, 21.1] of 77675.0
Codons List: [ATG, AAT, ACT, TTA, CGT, ATT, GGC, TTA, GTT, TCC, ATC, TCT, GAT, CGC, GCA, TCC, AGC, GGC, GTT, TAT, CAG, GAT, AAA, GGC, ATC, CCT, GCG, CTG, GAA, GAA, TGG, CTG, ACA, TCG, GCG, CTA, ACC, ACG, CCG, TTT, GAA, CTG, GAA, ACC, CGC, TTA, ATC, CCC, GAT, GAG, CAG, GCG, ATC, ATC, GAG, CAA, ACG, TTG, TGT, GAG, CTG, GTG, GAT, GAA, ATG, AGT, TGC, CAT, CTG, GTG, CTC, ACC, ACG, GGC, GGA, ACT, GGC, CCT, GCG, CGT, CGT, GAC, GTA, ACG, CCC, GAT, GCG, ACG, CTG, GCA, GTA, GCG, GAC, CGC, GAG, ATG, CCA, GGC, TTT, GGT, GAA, CAG, ATG, CGC, CAG, ATC, AGC, CTG, CAT, TTT, GTA, CCA, ACT, GCG, ATC, CTT, TCG, CGT, CAG, GTG, GGG, GTG, ATT, CGC, AAA, CAG, GCG, CTG, ATC, CTT, AAC, TTA, CCC, GGT, CAA, CCG, AAG, TCT, ATT, AAA, GAG, ACG, CTG, GAA, GGT, GTG, AAG, GAC, GCT, GAG, GGT, AAC, GTT, GTG, GTG, CAC, GGT, ATT, TTT, GCC, AGC, GTA, CCG, TAC, TGC, ATT, CAG, TTG, CTG, GAA, GGG, CCA, TAC, GTT, GAA, ACG, GCA, CCG, GAA, GTG, GTT, GCA, GCA, TTC, AGA, CCG, AAG, AGT, GCA, AGA, CGC, GAA, GTT, AGC, GAA, TAA]
Is Protein?: YES
Region Name: chaperone protein DnaK
Nucleotides: ATGGGTAAAATAATTGGTATCGACCTGGGTACTACCAACTCTTGTGTAGCGATTATGGATGGCACCACTCCTCGTGTACTGGAGAACGCCGAAGGCGATCGCACCACGCCTTCTATCATTGCCTATACCCAGGATGGTGAAACTCTGGTTGGTCAGCCGGCTAAACGTCAGGCAGTGACGAACCCGCAAAACACCCTGTTTGCGATTAAACGCCTGATTGGCCGCCGCTTCCAGGACGAAGAAGTACAGCGTGATGTTTCCATCATGCCGTTCAAAATTATTGCTGCTGATAACGGCGACGCATGGGTCGAAGTTAAAGGCCAGAAAATGGCACCGCCGCAGATCTCTGCTGAAGTGCTGAAAAAAATGAAGAAAACCGCTGAAGATTACCTGGGTGAACCGGTAACTGAAGCTGTTATTACCGTACCGGCATACTTTAACGATGCTCAGCGTCAGGCAACCAAAGACGCAGGCCGTATCGCTGGTCTGGAAGTAAAACGTATCATCAACGAACCGACCGCAGCTGCGCTGGCTTACGGTCTGGACAAAGGTACTGGCAACCGTACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTCCATTATCGAAATCGACGAAGTTGACGGCGAAAAAACCTTCGAAGTTCTGGCAACCAACGGTGATACCCACCTGGGTGGTGAAGACTTCGACAGTCGTCTGATCAACTATCTGGTTGAAGAATTCAAGAAAGATCAGGGCATTGACCTGCGCAACGATCCGCTGGCAATGCAGCGCCTGAAAGAAGCGGCAGAAAAAGCGAAAATCGAACTGTCTTCCGCTCAGCAGACCGACGTTAACCTGCCGTACATCACTGCAGACGCGACCGGTCCGAAACACATGAACATCAAAGTGACTCGTGCGAAACTGGAAAGCCTGGTTGAAGATCTGGTAAACCGTTCCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATATCGACGACGTTATTCTCGTTGGTGGTCAGACTCGTATGCCAATGGTTCAGAAGAAAGTTGCTGAATTCTTTGGTAAAGAGCCGCGTAAAGATGTTAACCCGGACGAAGCTGTAGCCATCGGTGCTGCTGTTCAGGGTGGTGTTCTGACTGGTGACGTAAAAGACGTACTGCTGCTGGACGTTACCCCGCTGTCTCTGGGTATCGAAACCATGGGCGGTGTGATGACCACGCTGATCGCGAAAAACACCACTATCCCGACCAAGCACAGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATCCATGTGCTGCAGGGTGAACGTAAACGTGCGGCTGATAACAAATCTCTGGGTCAGTTCAACCTGGATGGTATCAACCCGGCACCGCGCGGCATGCCGCAGATCGAAGTTACCTTCGATATCGATGCTGACGGTATCCTGCACGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCACTATCAAGGCTTCTTCTGGTCTGAACGAAGATGAAATCCAGAAAATGGTACGCGACGCAGAAGCTAACGCCGAAGCTGACCGTAAGTTTGAAGAGCTGGTACAGACTCGCAACCAGGGCGACCATCTGCTGCACAGCACCCGTAAGCAGGTTGAAGAAGCAGGCGACAAACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGACTGCACTGGAAACTGCTCTGAAAGGTGAAGACAAAGCCGCTATCGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCAGCAGCAACATGCCCAGCAGCAGACTGCCGGTGCTGATGCTTCTGCAAACAACGCGAAAGATGACGATGTTGTCGACGCTGAATTTGAAGAAGTCAAAGACAAAAAATAA
Nuc. Counts: [541, 475, 504, 397]
Total Mass%: [28.92, 20.88, 30.13, 19.65] of 252806.4
Codons List: [ATG, GGT, AAA, ATA, ATT, GGT, ATC, GAC, CTG, GGT, ACT, ACC, AAC, TCT, TGT, GTA, GCG, ATT, ATG, GAT, GGC, ACC, ACT, CCT, CGT, GTA, CTG, GAG, AAC, GCC, GAA, GGC, GAT, CGC, ACC, ACG, CCT, TCT, ATC, ATT, GCC, TAT, ACC, CAG, GAT, GGT, GAA, ACT, CTG, GTT, GGT, CAG, CCG, GCT, AAA, CGT, CAG, GCA, GTG, ACG, AAC, CCG, CAA, AAC, ACC, CTG, TTT, GCG, ATT, AAA, CGC, CTG, ATT, GGC, CGC, CGC, TTC, CAG, GAC, GAA, GAA, GTA, CAG, CGT, GAT, GTT, TCC, ATC, ATG, CCG, TTC, AAA, ATT, ATT, GCT, GCT, GAT, AAC, GGC, GAC, GCA, TGG, GTC, GAA, GTT, AAA, GGC, CAG, AAA, ATG, GCA, CCG, CCG, CAG, ATC, TCT, GCT, GAA, GTG, CTG, AAA, AAA, ATG, AAG, AAA, ACC, GCT, GAA, GAT, TAC, CTG, GGT, GAA, CCG, GTA, ACT, GAA, GCT, GTT, ATT, ACC, GTA, CCG, GCA, TAC, TTT, AAC, GAT, GCT, CAG, CGT, CAG, GCA, ACC, AAA, GAC, GCA, GGC, CGT, ATC, GCT, GGT, CTG, GAA, GTA, AAA, CGT, ATC, ATC, AAC, GAA, CCG, ACC, GCA, GCT, GCG, CTG, GCT, TAC, GGT, CTG, GAC, AAA, GGT, ACT, GGC, AAC, CGT, ACT, ATC, GCG, GTT, TAT, GAC, CTG, GGT, GGT, GGT, ACT, TTC, GAT, ATT, TCC, ATT, ATC, GAA, ATC, GAC, GAA, GTT, GAC, GGC, GAA, AAA, ACC, TTC, GAA, GTT, CTG, GCA, ACC, AAC, GGT, GAT, ACC, CAC, CTG, GGT, GGT, GAA, GAC, TTC, GAC, AGT, CGT, CTG, ATC, AAC, TAT, CTG, GTT, GAA, GAA, TTC, AAG, AAA, GAT, CAG, GGC, ATT, GAC, CTG, CGC, AAC, GAT, CCG, CTG, GCA, ATG, CAG, CGC, CTG, AAA, GAA, GCG, GCA, GAA, AAA, GCG, AAA, ATC, GAA, CTG, TCT, TCC, GCT, CAG, CAG, ACC, GAC, GTT, AAC, CTG, CCG, TAC, ATC, ACT, GCA, GAC, GCG, ACC, GGT, CCG, AAA, CAC, ATG, AAC, ATC, AAA, GTG, ACT, CGT, GCG, AAA, CTG, GAA, AGC, CTG, GTT, GAA, GAT, CTG, GTA, AAC, CGT, TCC, ATT, GAG, CCG, CTG, AAA, GTT, GCA, CTG, CAG, GAC, GCT, GGC, CTG, TCC, GTA, TCT, GAT, ATC, GAC, GAC, GTT, ATT, CTC, GTT, GGT, GGT, CAG, ACT, CGT, ATG, CCA, ATG, GTT, CAG, AAG, AAA, GTT, GCT, GAA, TTC, TTT, GGT, AAA, GAG, CCG, CGT, AAA, GAT, GTT, AAC, CCG, GAC, GAA, GCT, GTA, GCC, ATC, GGT, GCT, GCT, GTT, CAG, GGT, GGT, GTT, CTG, ACT, GGT, GAC, GTA, AAA, GAC, GTA, CTG, CTG, CTG, GAC, GTT, ACC, CCG, CTG, 
TCT, CTG, GGT, ATC, GAA, ACC, ATG, GGC, GGT, GTG, ATG, ACC, ACG, CTG, ATC, GCG, AAA, AAC, ACC, ACT, ATC, CCG, ACC, AAG, CAC, AGC, CAG, GTG, TTC, TCT, ACC, GCT, GAA, GAC, AAC, CAG, TCT, GCG, GTA, ACC, ATC, CAT, GTG, CTG, CAG, GGT, GAA, CGT, AAA, CGT, GCG, GCT, GAT, AAC, AAA, TCT, CTG, GGT, CAG, TTC, AAC, CTG, GAT, GGT, ATC, AAC, CCG, GCA, CCG, CGC, GGC, ATG, CCG, CAG, ATC, GAA, GTT, ACC, TTC, GAT, ATC, GAT, GCT, GAC, GGT, ATC, CTG, CAC, GTT, TCC, GCG, AAA, GAC, AAA, AAC, AGC, GGT, AAA, GAG, CAG, AAG, ATC, ACT, ATC, AAG, GCT, TCT, TCT, GGT, CTG, AAC, GAA, GAT, GAA, ATC, CAG, AAA, ATG, GTA, CGC, GAC, GCA, GAA, GCT, AAC, GCC, GAA, GCT, GAC, CGT, AAG, TTT, GAA, GAG, CTG, GTA, CAG, ACT, CGC, AAC, CAG, GGC, GAC, CAT, CTG, CTG, CAC, AGC, ACC, CGT, AAG, CAG, GTT, GAA, GAA, GCA, GGC, GAC, AAA, CTG, CCG, GCT, GAC, GAC, AAA, ACT, GCT, ATC, GAG, TCT, GCG, CTG, ACT, GCA, CTG, GAA, ACT, GCT, CTG, AAA, GGT, GAA, GAC, AAA, GCC, GCT, ATC, GAA, GCG, AAA, ATG, CAG, GAA, CTG, GCA, CAG, GTT, TCC, CAG, AAA, CTG, ATG, GAA, ATC, GCC, CAG, CAG, CAA, CAT, GCC, CAG, CAG, CAG, ACT, GCC, GGT, GCT, GAT, GCT, TCT, GCA, AAC, AAC, GCG, AAA, GAT, GAC, GAT, GTT, GTC, GAC, GCT, GAA, TTT, GAA, GAA, GTC, AAA, GAC, AAA, AAA, TAA]
Is Protein?: YES
Region Name: chaperone protein DnaJ
Nucleotides: GTGCATTCATCTAGGGGCAATTTAAAAAAGATGGCTAAGCAAGATTATTACGAGATTTTAGGCGTTTCCAAAACAGCGGAAGAGCGTGAAATCAAAAAGGCCTACAAACGCCTGGCCATGAAATACCACCCGGACCGTAACCAGGGTGACAAAGAGGCCGAGGCGAAATTTAAAGAGATCAAGGAAGCTTATGAAGTTCTGACCGACTCGCAAAAACGTGCGGCATACGATCAGTATGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGCGGTTTTGGCGGCGGCGCAGACTTCAGCGATATTTTTGGTGACGTTTTCGGCGATATTTTTGGCGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTACGCTATAACATGGAGCTCACCCTCGAAGAAGCTGTACGTGGCGTGACCAAAGAGATCCGCATTCCGACTCTGGAAGAGTGTGACGTTTGCCACGGTAGCGGTGCAAAACCAGGTACACAGCCGCAGACCTGTCCGACCTGTCATGGTTCTGGCCAGGTGCAGATGCGCCAGGGTTTCTTTGCCGTGCAGCAGACCTGTCCACACTGTCAGGGCCGCGGTACGCTGATCAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGTTGAGCGCAGCAAAACGCTGTCCGTTAAAATCCCGGCAGGGGTGGACACTGGAGACCGCATCCGTCTTGCGGGCGAAGGTGAAGCGGGTGAACACGGCGCACCGGCAGGCGATCTGTACGTTCAGGTTCAGGTTAAACAGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGCGAAGTCCCGATCAACTTCGCTATGGCGGCGCTGGGTGGTGAAATCGAAGTACCGACCCTTGATGGTCGCGTCAAACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAGCTGTTCCGTATGCGCGGTAAAGGCGTCAAGTCTGTCCGCGGTGGCGCACAGGGTGATTTGCTATGCCGCGTTGTTGTCGAAACACCGGTAGGTTTGAACGAGAAGCAGAAACAGCTGCTGCAAGAGCTGCAAGAAAGCTTTGGTGGCCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCTTCTTTGATGGCGTGAAGAAGTTTTTTGACGACCTGACTCGCTAA
Nuc. Counts: [287, 278, 352, 244]
Total Mass%: [25.2, 20.07, 34.57, 19.84] of 153867.6
Codons List: [GTG, CAT, TCA, TCT, AGG, GGC, AAT, TTA, AAA, AAG, ATG, GCT, AAG, CAA, GAT, TAT, TAC, GAG, ATT, TTA, GGC, GTT, TCC, AAA, ACA, GCG, GAA, GAG, CGT, GAA, ATC, AAA, AAG, GCC, TAC, AAA, CGC, CTG, GCC, ATG, AAA, TAC, CAC, CCG, GAC, CGT, AAC, CAG, GGT, GAC, AAA, GAG, GCC, GAG, GCG, AAA, TTT, AAA, GAG, ATC, AAG, GAA, GCT, TAT, GAA, GTT, CTG, ACC, GAC, TCG, CAA, AAA, CGT, GCG, GCA, TAC, GAT, CAG, TAT, GGT, CAT, GCT, GCG, TTT, GAG, CAA, GGT, GGC, ATG, GGC, GGC, GGC, GGT, TTT, GGC, GGC, GGC, GCA, GAC, TTC, AGC, GAT, ATT, TTT, GGT, GAC, GTT, TTC, GGC, GAT, ATT, TTT, GGC, GGC, GGA, CGT, GGT, CGT, CAA, CGT, GCG, GCG, CGC, GGT, GCT, GAT, TTA, CGC, TAT, AAC, ATG, GAG, CTC, ACC, CTC, GAA, GAA, GCT, GTA, CGT, GGC, GTG, ACC, AAA, GAG, ATC, CGC, ATT, CCG, ACT, CTG, GAA, GAG, TGT, GAC, GTT, TGC, CAC, GGT, AGC, GGT, GCA, AAA, CCA, GGT, ACA, CAG, CCG, CAG, ACC, TGT, CCG, ACC, TGT, CAT, GGT, TCT, GGC, CAG, GTG, CAG, ATG, CGC, CAG, GGT, TTC, TTT, GCC, GTG, CAG, CAG, ACC, TGT, CCA, CAC, TGT, CAG, GGC, CGC, GGT, ACG, CTG, ATC, AAA, GAT, CCG, TGC, AAC, AAA, TGT, CAT, GGT, CAT, GGT, CGT, GTT, GAG, CGC, AGC, AAA, ACG, CTG, TCC, GTT, AAA, ATC, CCG, GCA, GGG, GTG, GAC, ACT, GGA, GAC, CGC, ATC, CGT, CTT, GCG, GGC, GAA, GGT, GAA, GCG, GGT, GAA, CAC, GGC, GCA, CCG, GCA, GGC, GAT, CTG, TAC, GTT, CAG, GTT, CAG, GTT, AAA, CAG, CAC, CCG, ATT, TTC, GAG, CGT, GAA, GGC, AAC, AAC, CTG, TAT, TGC, GAA, GTC, CCG, ATC, AAC, TTC, GCT, ATG, GCG, GCG, CTG, GGT, GGT, GAA, ATC, GAA, GTA, CCG, ACC, CTT, GAT, GGT, CGC, GTC, AAA, CTG, AAA, GTG, CCT, GGC, GAA, ACC, CAG, ACC, GGT, AAG, CTG, TTC, CGT, ATG, CGC, GGT, AAA, GGC, GTC, AAG, TCT, GTC, CGC, GGT, GGC, GCA, CAG, GGT, GAT, TTG, CTA, TGC, CGC, GTT, GTT, GTC, GAA, ACA, CCG, GTA, GGT, TTG, AAC, GAG, AAG, CAG, AAA, CAG, CTG, CTG, CAA, GAG, CTG, CAA, GAA, AGC, TTT, GGT, GGC, CCA, ACC, GGC, GAG, CAC, AAC, AGC, CCG, CGT, TCA, AAG, AGC, TTC, TTT, GAT, GGC, GTG, AAG, AAG, TTT, TTT, GAC, GAC, CTG, ACT, CGC, TAA]
Is Protein?: NO
Region Name: hypothetical protein
Nucleotides: TTGCTCTTACTCGGATTCGTAAGCCGTGAAAACAGCAACCTCCGTCTGGCCAGTTCGGATGTGAACCTCACAGAGGTCTTTTCTCGTTACCAGCGCCGCCACTACGGCGGTGATACAGATGACGATCAGGGCGACAATCATCGCCTTATGCTGCTTCATTGCTCTCTTCTCCTTGACCTTTCGGTCAGTAAGAGGCACTCTACATGTGTTCTGCATATAGGGGGCCTCGGGTTGATGGTAAAATATCACTCGGGGCTTTTCTCTATCTGCCGTTCAGCTAATGCCTGA
Nuc. Counts: [58, 78, 69, 83]
Total Mass%: [21.04, 23.27, 28.0, 27.88] of 37245.0
Codons List: [TTG, CTC, TTA, CTC, GGA, TTC, GTA, AGC, CGT, GAA, AAC, AGC, AAC, CTC, CGT, CTG, GCC, AGT, TCG, GAT, GTG, AAC, CTC, ACA, GAG, GTC, TTT, TCT, CGT, TAC, CAG, CGC, CGC, CAC, TAC, GGC, GGT, GAT, ACA, GAT, GAC, GAT, CAG, GGC, GAC, AAT, CAT, CGC, CTT, ATG, CTG, CTT, CAT, TGC, TCT, CTT, CTC, CTT, GAC, CTT, TCG, GTC, AGT, AAG, AGG, CAC, TCT, ACA, TGT, GTT, CTG, CAT, ATA, GGG, GGC, CTC, GGG, TTG, ATG, GTA, AAA, TAT, CAC, TCG, GGG, CTT, TTC, TCT, ATC, TGC, CGT, TCA, GCT, AAT, GCC, TGA]
Is Protein?: NO
Region Name: hypothetical protein
Nucleotides: ATGTCTGCCAAAAGACGACTTCTTATTGCGTGTACCTTGATAACAGCTATCTATCATTTTCCTGCATATTCTTCATTAGAATATAAAGGATCCTTTGGTTCAATAAATGCGGGTTATGCAGACTGGAATAGTGGATTTGTAAACACTCACCGTGGTGAAGTATGGAAAGTGACTGCGGATTTTGGGGTAAATTTTAAAGAAGCAGAATTTTACTCATTTTATGAAAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACGGTTTCAGCAATGACGCATGTCAGACTCTTTGACTCTGATATGACATTCTTTGGCAAAATTTATGGCCAATGGGATAACTCATGGGGTGACGATCTGGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCGAGTGGGGCTTTTTTAAACCGTATATTGGATTGCATAATCAATCTGGTGACTACGTATCAGCTAAATATGGTCAAACGAATGGTTGGAATGGTTATGTTGTTGGCTGGACAGCAGTATTACCATTTACGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGAAATAGAACTGGACAGGAACGATGCTTACACGGAGCAGCAATTTGGCCGGAACGGGTTAAATGGCGGTTTAACTATTGCCTGGAAGTTCTATCCTCGCTGGAAAGCCAGTGTGACGTGGCGTTATTTCGATAATAAGCTGGGCTACGATGGCTTTGGCGATCAAATGATTTATATGCTTGGTTATGATTTCTAA
Nuc. Counts: [214, 121, 184, 243]
Total Mass%: [29.25, 13.6, 28.13, 30.75] of 98860.9
Codons List: [ATG, TCT, GCC, AAA, AGA, CGA, CTT, CTT, ATT, GCG, TGT, ACC, TTG, ATA, ACA, GCT, ATC, TAT, CAT, TTT, CCT, GCA, TAT, TCT, TCA, TTA, GAA, TAT, AAA, GGA, TCC, TTT, GGT, TCA, ATA, AAT, GCG, GGT, TAT, GCA, GAC, TGG, AAT, AGT, GGA, TTT, GTA, AAC, ACT, CAC, CGT, GGT, GAA, GTA, TGG, AAA, GTG, ACT, GCG, GAT, TTT, GGG, GTA, AAT, TTT, AAA, GAA, GCA, GAA, TTT, TAC, TCA, TTT, TAT, GAA, AGT, AAT, GTA, CTC, AAT, CAT, GCT, GTA, GCA, GGG, AGA, AAT, CAT, ACG, GTT, TCA, GCA, ATG, ACG, CAT, GTC, AGA, CTC, TTT, GAC, TCT, GAT, ATG, ACA, TTC, TTT, GGC, AAA, ATT, TAT, GGC, CAA, TGG, GAT, AAC, TCA, TGG, GGT, GAC, GAT, CTG, GAC, ATG, TTT, TAT, GGA, TTC, GGT, TAC, CTC, GGC, TGG, AAC, GGC, GAG, TGG, GGC, TTT, TTT, AAA, CCG, TAT, ATT, GGA, TTG, CAT, AAT, CAA, TCT, GGT, GAC, TAC, GTA, TCA, GCT, AAA, TAT, GGT, CAA, ACG, AAT, GGT, TGG, AAT, GGT, TAT, GTT, GTT, GGC, TGG, ACA, GCA, GTA, TTA, CCA, TTT, ACG, TTA, TTT, GAC, GAA, AAA, TTT, GTT, TTA, TCT, AAC, TGG, AAT, GAA, ATA, GAA, CTG, GAC, AGG, AAC, GAT, GCT, TAC, ACG, GAG, CAG, CAA, TTT, GGC, CGG, AAC, GGG, TTA, AAT, GGC, GGT, TTA, ACT, ATT, GCC, TGG, AAG, TTC, TAT, CCT, CGC, TGG, AAA, GCC, AGT, GTG, ACG, TGG, CGT, TAT, TTC, GAT, AAT, AAG, CTG, GGC, TAC, GAT, GGC, TTT, GGC, GAT, CAA, ATG, ATT, TAT, ATG, CTT, GGT, TAT, GAT, TTC, TAA]
Is Protein?: YES
Region Name: putative secreted sulfatase
Nucleotides: ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAATGCTTTTAGTCCTGCCTTAGCCGCAGAGGCTAAACAACCTAATTTAGTCATTATTATGGCGGATGATTTAGGTTATGGCGATTTAGCAACATATGGTCATCAGATCGTTAAAACACCTAATATCGACAGGCTTGCCCAGGAAGGGGTCAAATTTACTGACTACTATGCCCCCGCTCCTTTAAGTTCACCTTCACGCGCAGGGCTATTAACCGGCCGGATGCCATTTCGTACTGGAATTCGCTCATGGATTCCTTCAGGCAAAGATGTTGCCTTAGGGCGTAACGAACTCACGATTGCTAATCTACTCAAAGCGCAAGGGTACGACACGGCAATGATGGGTAAGCTGCATCTGAATGCAGGCGGCGATCGCACCGATCAGCCACAAGCACAAGATATGGGCTTTGATTACTCACTGGTTAATACGGCGGGCTTTGTTACCGACGCCACGCTGGATAACGCTAAAGAACGCCCGCGTTATGGCATGGTTTACCCGACAGGCTGGCTACGTAACGGGCAACCCACTCCACGAGCTGATAAAATGAGCGGTGAGTATGTCAGTTCGGAAGTCGTCAACTGGCTGGATAACAAAAAGGACAGCAAGCCTTTCTTCCTCTATGTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAAAATACCTCGATATGTACTCACAATATATGAGCGCGTATCAGAAGCAGCATCCTGATTTATTTTATGGCGACTGGGCAGACAAACCCTGGCGTGGTGTGGGGGAATATTATGCCAATATCAGCTATCTGGATGCACAGGTTGGAAAAGTGCTGGATAAAATCAAAGCTGTGGGTGAAGAAGATAACACAATCGTTATTTTTACCAGTGATAACGGTCCGGTAACGCGTGAAGCGCGCAAAGTGTATGAGCTGAATTTGGCAGGGGAAACGGATGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGTGTTCCAGCCATTATTAAATATGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGTCTGGACTGGATGCCTACTTTAGCGAAAATGATGAACTTCAAATTACCTACAGACCGTACTTTCGATGGTGAATCGCTGGTTCCTGTTCTTGAGCAAAAAGCATTGAAACGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATGATCCAACCGATGAATGGGCGATCCGTGATGGTGACTGGAAGATGATTATCGATCGCAATAATAAACCGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAACACTTAATCTGATCGGTAAAAAAACAGATATTGAAAAACAGATGTATGGTAAGTTTTTAAAATATAAAACTGATATTGATAATGATTCTCTAATGAAAGCCAGAGGTGATAAACCAGAAGCGGTGACCTGGGGCTAA
Nuc. Counts: [440, 312, 362, 380]
Total Mass%: [30.43, 17.74, 28.0, 24.33] of 195417.1
Codons List: [ATG, CAG, AAA, ACG, TTA, ATG, GCC, AGT, TTG, ATC, GGC, CTT, GCA, GTT, TGC, ACA, GGG, AAT, GCT, TTT, AGT, CCT, GCC, TTA, GCC, GCA, GAG, GCT, AAA, CAA, CCT, AAT, TTA, GTC, ATT, ATT, ATG, GCG, GAT, GAT, TTA, GGT, TAT, GGC, GAT, TTA, GCA, ACA, TAT, GGT, CAT, CAG, ATC, GTT, AAA, ACA, CCT, AAT, ATC, GAC, AGG, CTT, GCC, CAG, GAA, GGG, GTC, AAA, TTT, ACT, GAC, TAC, TAT, GCC, CCC, GCT, CCT, TTA, AGT, TCA, CCT, TCA, CGC, GCA, GGG, CTA, TTA, ACC, GGC, CGG, ATG, CCA, TTT, CGT, ACT, GGA, ATT, CGC, TCA, TGG, ATT, CCT, TCA, GGC, AAA, GAT, GTT, GCC, TTA, GGG, CGT, AAC, GAA, CTC, ACG, ATT, GCT, AAT, CTA, CTC, AAA, GCG, CAA, GGG, TAC, GAC, ACG, GCA, ATG, ATG, GGT, AAG, CTG, CAT, CTG, AAT, GCA, GGC, GGC, GAT, CGC, ACC, GAT, CAG, CCA, CAA, GCA, CAA, GAT, ATG, GGC, TTT, GAT, TAC, TCA, CTG, GTT, AAT, ACG, GCG, GGC, TTT, GTT, ACC, GAC, GCC, ACG, CTG, GAT, AAC, GCT, AAA, GAA, CGC, CCG, CGT, TAT, GGC, ATG, GTT, TAC, CCG, ACA, GGC, TGG, CTA, CGT, AAC, GGG, CAA, CCC, ACT, CCA, CGA, GCT, GAT, AAA, ATG, AGC, GGT, GAG, TAT, GTC, AGT, TCG, GAA, GTC, GTC, AAC, TGG, CTG, GAT, AAC, AAA, AAG, GAC, AGC, AAG, CCT, TTC, TTC, CTC, TAT, GTT, GCT, TTT, ACC, GAA, GTG, CAT, AGC, CCC, CTG, GCT, TCG, CCC, AAA, AAA, TAC, CTC, GAT, ATG, TAC, TCA, CAA, TAT, ATG, AGC, GCG, TAT, CAG, AAG, CAG, CAT, CCT, GAT, TTA, TTT, TAT, GGC, GAC, TGG, GCA, GAC, AAA, CCC, TGG, CGT, GGT, GTG, GGG, GAA, TAT, TAT, GCC, AAT, ATC, AGC, TAT, CTG, GAT, GCA, CAG, GTT, GGA, AAA, GTG, CTG, GAT, AAA, ATC, AAA, GCT, GTG, GGT, GAA, GAA, GAT, AAC, ACA, ATC, GTT, ATT, TTT, ACC, AGT, GAT, AAC, GGT, CCG, GTA, ACG, CGT, GAA, GCG, CGC, AAA, GTG, TAT, GAG, CTG, AAT, TTG, GCA, GGG, GAA, ACG, GAT, GGA, TTA, CGC, GGT, CGC, AAG, GAT, AAC, CTT, TGG, GAA, GGC, GGA, ATT, CGT, GTT, CCA, GCC, ATT, ATT, AAA, TAT, GGT, AAA, CAT, CTA, CCA, CAG, GGA, ATG, GTT, TCA, GAT, ACA, CCC, GTT, TAT, GGT, CTG, GAC, TGG, ATG, CCT, ACT, TTA, GCG, AAA, ATG, ATG, AAC, TTC, AAA, TTA, CCT, ACA, GAC, CGT, ACT, TTC, GAT, GGT, GAA, TCG, CTG, GTT, CCT, GTT, CTT, GAG, 
CAA, AAA, GCA, TTG, AAA, CGC, GAA, AAG, CCA, TTA, ATT, TTC, GGG, ATT, GAT, ATG, CCA, TTC, CAG, GAT, GAT, CCA, ACC, GAT, GAA, TGG, GCG, ATC, CGT, GAT, GGT, GAC, TGG, AAG, ATG, ATT, ATC, GAT, CGC, AAT, AAT, AAA, CCG, AAA, TAT, CTC, TAC, AAT, CTG, AAA, TCT, GAT, CGT, TAT, GAA, ACA, CTT, AAT, CTG, ATC, GGT, AAA, AAA, ACA, GAT, ATT, GAA, AAA, CAG, ATG, TAT, GGT, AAG, TTT, TTA, AAA, TAT, AAA, ACT, GAT, ATT, GAT, AAT, GAT, TCT, CTA, ATG, AAA, GCC, AGA, GGT, GAT, AAA, CCA, GAA, GCG, GTG, ACC, TGG, GGC, TAA]
Is Protein?: YES
Region Name: putative cytoplasmic protein
Nucleotides: ATGTTTACCAACGTAAATGTTGATTGTTGCAAAACACCAGGATGTAAAAACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCACAGGGTAAAAATATTTTATGCCGTGAATGTGGTTACTTGTTTCCAGTGATATCTGAACAGTCGCTTAATATTTATCGTAATATTGTGAATCACTCCTGGAGAGGTTTGATTTGCCAATGTTCAACTTGCGGAGGCACGTCCCTCAAAAAATATGGATATTCTGCACAAGGCCAGAGAAGAATGTATTGCCATCATTGTGAGAAAACATTTATCACTCTGGAACATGTAATTACCACACCACGAGGAGCCCTGTTAGCATTGATGATTGAGCAAGGGGAGGCACTTGCGGATATCAGAAAGTCATTACGTCTTAACAGCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGCAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGTACCCGCGCTTTTCGCGTCAAGTATAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGCGGCAGGGTGGTTGCCATCTCAACCAATTACTCCCCATCTGCCGTAGAGCAACATTATCAATACACATCGAACTATGAAGAGCGTATGTCTCCAGGGACGCTGGCACATCATGTCCAGCGCAAAGAGTTACTTACTATGCGGCGGGATACCTTGTTTGATATTGATTACGGCCCGGCAGTTTTACATCAAAACGATCCGGGAATGTTGGTAAAACCGGTTCTTCCGGCATATCGTCATTTTGAACTGGTCAGAATACTGACCGATGAGCATTCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATATTGGGCGGCTGCCTGATGGCTAATTTGCAGCATATTCATCAAGGTCGCTGCCATATTTCCTTTGTCAAAGAGCGCGGTGTGGCACCCGCCACCATTGATTTTCCACCGCGATTATTCCTTAGTGGTGGGGTACGAAATAATGTCTGGCGTGCATTTTCTAACCGCAATTATTCAATGGCTGTATGCAATCTCACTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATTGAACAGTGCGACGCGTTTTATCCACTTTGTGGAGAACCATCCTTTCCTTATATCATTGAACCGAATGTCTCCTGCGAATGTCGTTTCTACATTAGATATCCTCAAACATCTGTGGAATAAAAAACTAGAGCATGGAACAATTTAA
Nuc. Counts: [355, 273, 276, 356]
Total Mass%: [29.36, 18.56, 25.53, 27.26] of 163388.6
Codons List: [ATG, TTT, ACC, AAC, GTA, AAT, GTT, GAT, TGT, TGC, AAA, ACA, CCA, GGA, TGT, AAA, AAC, CTG, GGG, TTG, CTG, AAT, AGC, CAG, GAT, TAT, GTC, GCA, CAG, GGT, AAA, AAT, ATT, TTA, TGC, CGT, GAA, TGT, GGT, TAC, TTG, TTT, CCA, GTG, ATA, TCT, GAA, CAG, TCG, CTT, AAT, ATT, TAT, CGT, AAT, ATT, GTG, AAT, CAC, TCC, TGG, AGA, GGT, TTG, ATT, TGC, CAA, TGT, TCA, ACT, TGC, GGA, GGC, ACG, TCC, CTC, AAA, AAA, TAT, GGA, TAT, TCT, GCA, CAA, GGC, CAG, AGA, AGA, ATG, TAT, TGC, CAT, CAT, TGT, GAG, AAA, ACA, TTT, ATC, ACT, CTG, GAA, CAT, GTA, ATT, ACC, ACA, CCA, CGA, GGA, GCC, CTG, TTA, GCA, TTG, ATG, ATT, GAG, CAA, GGG, GAG, GCA, CTT, GCG, GAT, ATC, AGA, AAG, TCA, TTA, CGT, CTT, AAC, AGC, ACT, GGA, CTT, AGC, CGT, GAA, CTG, TTA, AAA, TTA, GCG, CGT, GAA, GCA, AAC, TAT, AAA, GAA, AGT, CGA, CAG, TGT, TTC, CCT, GCT, TCT, GAT, ATT, ACC, CTG, AGT, ACC, CGC, GCT, TTT, CGC, GTC, AAG, TAT, AAT, GGT, AGC, AAT, AAC, TCT, CTT, TAT, GCT, CTT, GTT, ACC, GCA, GAA, GAA, CAA, AGC, GGC, AGG, GTG, GTT, GCC, ATC, TCA, ACC, AAT, TAC, TCC, CCA, TCT, GCC, GTA, GAG, CAA, CAT, TAT, CAA, TAC, ACA, TCG, AAC, TAT, GAA, GAG, CGT, ATG, TCT, CCA, GGG, ACG, CTG, GCA, CAT, CAT, GTC, CAG, CGC, AAA, GAG, TTA, CTT, ACT, ATG, CGG, CGG, GAT, ACC, TTG, TTT, GAT, ATT, GAT, TAC, GGC, CCG, GCA, GTT, TTA, CAT, CAA, AAC, GAT, CCG, GGA, ATG, TTG, GTA, AAA, CCG, GTT, CTT, CCG, GCA, TAT, CGT, CAT, TTT, GAA, CTG, GTC, AGA, ATA, CTG, ACC, GAT, GAG, CAT, TCC, AAC, AAC, GTT, CAG, CAT, TAC, CTT, GAT, CAC, GAA, TGC, TTT, ATA, TTG, GGC, GGC, TGC, CTG, ATG, GCT, AAT, TTG, CAG, CAT, ATT, CAT, CAA, GGT, CGC, TGC, CAT, ATT, TCC, TTT, GTC, AAA, GAG, CGC, GGT, GTG, GCA, CCC, GCC, ACC, ATT, GAT, TTT, CCA, CCG, CGA, TTA, TTC, CTT, AGT, GGT, GGG, GTA, CGA, AAT, AAT, GTC, TGG, CGT, GCA, TTT, TCT, AAC, CGC, AAT, TAT, TCA, ATG, GCT, GTA, TGC, AAT, CTC, ACT, GGC, AGT, AAG, AAA, GTC, CGC, GAG, ATG, CGG, CAT, GCA, ACA, TTG, AAC, AGT, GCG, ACG, CGT, TTT, ATC, CAC, TTT, GTG, GAG, AAC, CAT, CCT, TTC, CTT, ATA, TCA, TTG, AAC, CGA, ATG, TCT, CCT, GCG, 
AAT, GTC, GTT, TCT, ACA, TTA, GAT, ATC, CTC, AAA, CAT, CTG, TGG, AAT, AAA, AAA, CTA, GAG, CAT, GGA, ACA, ATT, TAA]
Is Protein?: YES
Region Name: sodium/proton antiporter 1
Nucleotides: GTGAAACATCTGCATCGATTCTTTAGCAGTGATGCCTCGGGAGGCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTGCAACCAGTGGATGGTATCACGACTTTCTTGAGACGCCGGTTCAGCTCCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGACGCTCTGATGGCGGTATTTTTCCTGTTGGTTGGTCTGGAAGTTAAACGCGAGCTGATGCAAGGTTCGCTGGCCAGTCTGCGCCAGGCGGCATTTCCTGTTATTGCCGCAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTTTTAACTATGCCGATCCGATTACCCGCGAAGGCTGGGCAATCCCGGCGGCGACTGACATTGCCTTTGCACTTGGTGTGTTGGCGCTGTTGGGAAGTCGTGTTCCGTTAGCGCTGAAGATCTTTTTGATGGCTCTGGCTATTATCGACGATCTTGGGGCCATCATTATCATCGCATTGTTCTACACTAATGACTTATCGATGGCCTCTCTTGGCGTCGCGGCTGTAGCAATTGCGGTACTCGCGGTATTGAATCTGTGTGGTGTACGCCGCACGGGCGTTTATATTCTGGTTGGCGTGGTGCTGTGGACAGCGGTGTTGAAATCGGGGGTTCACGCAACCCTGGCTGGCGTCATTGTCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGGCGCTCTCCGGCTAAACGTCTGGAGCATGTTTTGCATCCATGGGTGGCGTATCTGATTTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAAGGTGTCACGCTGGAAGGTTTGACCTCCATTCTGCCATTAGGGATCATCGCTGGTTTGCTGATTGGCAAGCCACTGGGTATTAGTCTGTTCTGCTGGTTGGCGCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACGACTTACCAGCAAATTATGGCGGTTGGTATCCTGTGCGGTATCGGTTTTACTATGTCTATCTTTATTGCCAGCCTGGCATTTGGTAGCGTAGATCCAGAACTGATTAACTGGGCAAAATTAGGTATCCTTGTCGGTTCAATTTCTTCGGCGGTAATTGGATATAGCTGGTTACGCGTTCGTTTACGTCCATCAGTTTGA
Nuc. Counts: [215, 258, 331, 363]
Total Mass%: [19.15, 18.9, 32.98, 29.94] of 151683.9
Codons List: [GTG, AAA, CAT, CTG, CAT, CGA, TTC, TTT, AGC, AGT, GAT, GCC, TCG, GGA, GGC, ATT, ATT, CTC, ATT, ATT, GCC, GCT, GTA, TTA, GCG, ATG, ATT, ATG, GCC, AAC, AGC, GGT, GCA, ACC, AGT, GGA, TGG, TAT, CAC, GAC, TTT, CTT, GAG, ACG, CCG, GTT, CAG, CTC, CGG, GTT, GGG, ACA, CTT, GAG, ATC, AAC, AAG, AAC, ATG, CTG, CTA, TGG, ATC, AAT, GAC, GCT, CTG, ATG, GCG, GTA, TTT, TTC, CTG, TTG, GTT, GGT, CTG, GAA, GTT, AAA, CGC, GAG, CTG, ATG, CAA, GGT, TCG, CTG, GCC, AGT, CTG, CGC, CAG, GCG, GCA, TTT, CCT, GTT, ATT, GCC, GCA, ATC, GGC, GGG, ATG, ATT, GTC, CCG, GCA, TTG, CTC, TAT, CTG, GCT, TTT, AAC, TAT, GCC, GAT, CCG, ATT, ACC, CGC, GAA, GGC, TGG, GCA, ATC, CCG, GCG, GCG, ACT, GAC, ATT, GCC, TTT, GCA, CTT, GGT, GTG, TTG, GCG, CTG, TTG, GGA, AGT, CGT, GTT, CCG, TTA, GCG, CTG, AAG, ATC, TTT, TTG, ATG, GCT, CTG, GCT, ATT, ATC, GAC, GAT, CTT, GGG, GCC, ATC, ATT, ATC, ATC, GCA, TTG, TTC, TAC, ACT, AAT, GAC, TTA, TCG, ATG, GCC, TCT, CTT, GGC, GTC, GCG, GCT, GTA, GCA, ATT, GCG, GTA, CTC, GCG, GTA, TTG, AAT, CTG, TGT, GGT, GTA, CGC, CGC, ACG, GGC, GTT, TAT, ATT, CTG, GTT, GGC, GTG, GTG, CTG, TGG, ACA, GCG, GTG, TTG, AAA, TCG, GGG, GTT, CAC, GCA, ACC, CTG, GCT, GGC, GTC, ATT, GTC, GGC, TTC, TTT, ATT, CCT, TTG, AAA, GAG, AAG, CAT, GGG, CGC, TCT, CCG, GCT, AAA, CGT, CTG, GAG, CAT, GTT, TTG, CAT, CCA, TGG, GTG, GCG, TAT, CTG, ATT, TTG, CCG, CTG, TTT, GCA, TTT, GCT, AAT, GCT, GGC, GTT, TCA, CTG, CAA, GGT, GTC, ACG, CTG, GAA, GGT, TTG, ACC, TCC, ATT, CTG, CCA, TTA, GGG, ATC, ATC, GCT, GGT, TTG, CTG, ATT, GGC, AAG, CCA, CTG, GGT, ATT, AGT, CTG, TTC, TGC, TGG, TTG, GCG, CTG, CGT, TTG, AAA, TTG, GCA, CAT, CTG, CCA, GAG, GGA, ACG, ACT, TAC, CAG, CAA, ATT, ATG, GCG, GTT, GGT, ATC, CTG, TGC, GGT, ATC, GGT, TTT, ACT, ATG, TCT, ATC, TTT, ATT, GCC, AGC, CTG, GCA, TTT, GGT, AGC, GTA, GAT, CCA, GAA, CTG, ATT, AAC, TGG, GCA, AAA, TTA, GGT, ATC, CTT, GTC, GGT, TCA, ATT, TCT, TCG, GCG, GTA, ATT, GGA, TAT, AGC, TGG, TTA, CGC, GTT, CGT, TTA, CGT, CCA, TCA, GTT, TGA]
Is Protein?: NO
Region Name: transcriptional activator protein NhaR
Nucleotides: ATGAGCATGTCTCATATCAATTACAACCACTTGTATTACTTCTGGCATGTCTACAAAGAAGGTTCTGTGGTTGGCGCAGCGGAGGCGCTTTATTTAACACCACAAACCATTACCGGGCAGATCCGGGCGCTGGAAGAGCGCCTGCAAGGGAAACTATTTAAGCGTAAAGGACGTGGTCTGGAACCCAGCGAACTGGGGGAACTGGTCTATCGCTATGCCGATAAAATGTTCACCTTAAGCCAGGAAATGCTGGATATCGTCAACTATCGCAAAGAGTCCAACTTATTGTTTGATGTTGGTGTGGCAGATGCACTTTCCAAACGTCTGGTCAGCAGTGTTCTGGATGCCGCAGTTGTGGAAGACGAGCAGATCCATCTACGCTGTTTCGAATCGACGCACGAGATGCTTTTAGAGCAGTTGAGTCAGCATAAACTGGATATGATCATCTCTGACTGTCCGATCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAATTGGCGAATGTGGTGTCAGTTTCTGGTGCACTAACCCACTACCAGAAAAGCCGTTTCCTGCCTGTCTTGAAGAGCGTCGTTTACTTATTCCGGGGCGTCGCTCAATGTTGGGGCGTAAACTATTAAACTGGTTTAACTCCCAGGGCTTGAACGTCGAAATTTTGGGTGAGTTTGATGATGCTGCGTTGATGAAAGCCTTTGGGGCGACGCATAACGCTATTTTCGTTGCACCTTCGCTTTACGCTAATGATTTCTATAACGATGACTCGGTTGTGGAGATAGGCCGTGTTGAGAACGTGATGGAAGAGTACCACGCGATTTTTGCCGAAAGGATGATTCAGCACCCTGCAGTACAGCGTATCTGCAATACAGACTATTCTGCGCTGTTTACTCCAGCTTCAAAATAA
Nuc. Counts: [228, 197, 232, 249]
Total Mass%: [26.07, 18.52, 29.67, 26.36] of 118181.6
Codons List: [ATG, AGC, ATG, TCT, CAT, ATC, AAT, TAC, AAC, CAC, TTG, TAT, TAC, TTC, TGG, CAT, GTC, TAC, AAA, GAA, GGT, TCT, GTG, GTT, GGC, GCA, GCG, GAG, GCG, CTT, TAT, TTA, ACA, CCA, CAA, ACC, ATT, ACC, GGG, CAG, ATC, CGG, GCG, CTG, GAA, GAG, CGC, CTG, CAA, GGG, AAA, CTA, TTT, AAG, CGT, AAA, GGA, CGT, GGT, CTG, GAA, CCC, AGC, GAA, CTG, GGG, GAA, CTG, GTC, TAT, CGC, TAT, GCC, GAT, AAA, ATG, TTC, ACC, TTA, AGC, CAG, GAA, ATG, CTG, GAT, ATC, GTC, AAC, TAT, CGC, AAA, GAG, TCC, AAC, TTA, TTG, TTT, GAT, GTT, GGT, GTG, GCA, GAT, GCA, CTT, TCC, AAA, CGT, CTG, GTC, AGC, AGT, GTT, CTG, GAT, GCC, GCA, GTT, GTG, GAA, GAC, GAG, CAG, ATC, CAT, CTA, CGC, TGT, TTC, GAA, TCG, ACG, CAC, GAG, ATG, CTT, TTA, GAG, CAG, TTG, AGT, CAG, CAT, AAA, CTG, GAT, ATG, ATC, ATC, TCT, GAC, TGT, CCG, ATC, GAT, TCC, ACT, CAG, CAG, GAA, GGG, CTG, TTT, TCC, ATG, AAA, ATT, GGC, GAA, TGT, GGT, GTC, AGT, TTC, TGG, TGC, ACT, AAC, CCA, CTA, CCA, GAA, AAG, CCG, TTT, CCT, GCC, TGT, CTT, GAA, GAG, CGT, CGT, TTA, CTT, ATT, CCG, GGG, CGT, CGC, TCA, ATG, TTG, GGG, CGT, AAA, CTA, TTA, AAC, TGG, TTT, AAC, TCC, CAG, GGC, TTG, AAC, GTC, GAA, ATT, TTG, GGT, GAG, TTT, GAT, GAT, GCT, GCG, TTG, ATG, AAA, GCC, TTT, GGG, GCG, ACG, CAT, AAC, GCT, ATT, TTC, GTT, GCA, CCT, TCG, CTT, TAC, GCT, AAT, GAT, TTC, TAT, AAC, GAT, GAC, TCG, GTT, GTG, GAG, ATA, GGC, CGT, GTT, GAG, AAC, GTG, ATG, GAA, GAG, TAC, CAC, GCG, ATT, TTT, GCC, GAA, AGG, ATG, ATT, CAG, CAC, CCT, GCA, GTA, CAG, CGT, ATC, TGC, AAT, ACA, GAC, TAT, TCT, GCG, CTG, TTT, ACT, CCA, GCT, TCA, AAA, TAA]
Is Protein?: YES
Region Name: riboflavin kinase
Nucleotides: ATGAAGCTGATACGCGGCATACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTAATTTCGACGGCGTGCATCGCGGTCATCGCGCGCTGTTACAGGGCTTGCAGGAAGAAGGGCGCAAGCGCAACTTACCGGTGATGGTGATGCTTTTTGAACCTCAACCACTGGAACTGTTTGCTACTGATAAAGCCCCGGCACGGCTCACCCGGCTGCGGGAAAAACTGCGTTATCTTGCAGAGTGTGGCGTTGATTACGTGCTGTGCGTGCGTTTTGACAGGCGTTTTGCGGCGTTAACCGCGCAAAACTTCATCAGTGATCTTCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGATTTCCGCTTTGGCGCTGGTCGTGAAGGCGATTTCTTGTTATTACAGAAAGCGGGCATGGAATACGGCTTCGATATCACCAGCACGCAAACTTTTTGCGAAGGTGGTGTGCGTATCAGCAGCACCGCCGTGCGTCAGGCGCTTGCGGATGACAATCTGGCTCTGGCAGAAAGTTTACTGGGGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGAATTAGGGCGCACTATAGGTTTCCCGACGGCGAATGTACCGCTACGCCGTCAGGTTTCCCCGGTGAAAGGGGTTTATGCGGTAGAAGTGTTGGGCCTTGGCGAAAAGCCGTTACCCGGCGTTGCAAACATCGGAACACGCCCAACGGTTGCCGGTATTCGCCAGCAACTGGAAGTGCATTTGTTAGATGTTGCAATGGACCTTTATGGTCGCCATATACAAGTAGTGCTGCGTAAAAAAATACGCAATGAGCAGCGATTTGCATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGCCCGCGAATTTTTTGGGCTAACAAAACCGGCTTAA
Nuc. Counts: [213, 221, 276, 232]
Total Mass%: [23.23, 19.81, 33.66, 23.42] of 123918.1
Codons List: [ATG, AAG, CTG, ATA, CGC, GGC, ATA, CAT, AAT, CTC, AGC, CAG, GCC, CCG, CAA, GAA, GGG, TGT, GTG, CTG, ACT, ATT, GGT, AAT, TTC, GAC, GGC, GTG, CAT, CGC, GGT, CAT, CGC, GCG, CTG, TTA, CAG, GGC, TTG, CAG, GAA, GAA, GGG, CGC, AAG, CGC, AAC, TTA, CCG, GTG, ATG, GTG, ATG, CTT, TTT, GAA, CCT, CAA, CCA, CTG, GAA, CTG, TTT, GCT, ACT, GAT, AAA, GCC, CCG, GCA, CGG, CTC, ACC, CGG, CTG, CGG, GAA, AAA, CTG, CGT, TAT, CTT, GCA, GAG, TGT, GGC, GTT, GAT, TAC, GTG, CTG, TGC, GTG, CGT, TTT, GAC, AGG, CGT, TTT, GCG, GCG, TTA, ACC, GCG, CAA, AAC, TTC, ATC, AGT, GAT, CTT, CTG, GTG, AAG, CAC, TTG, CGG, GTA, AAA, TTT, CTT, GCC, GTA, GGT, GAC, GAT, TTC, CGC, TTT, GGC, GCT, GGT, CGT, GAA, GGC, GAT, TTC, TTG, TTA, TTA, CAG, AAA, GCG, GGC, ATG, GAA, TAC, GGC, TTC, GAT, ATC, ACC, AGC, ACG, CAA, ACT, TTT, TGC, GAA, GGT, GGT, GTG, CGT, ATC, AGC, AGC, ACC, GCC, GTG, CGT, CAG, GCG, CTT, GCG, GAT, GAC, AAT, CTG, GCT, CTG, GCA, GAA, AGT, TTA, CTG, GGG, CAC, CCG, TTT, GCT, ATC, TCC, GGG, CGT, GTA, GTC, CAC, GGT, GAT, GAA, TTA, GGG, CGC, ACT, ATA, GGT, TTC, CCG, ACG, GCG, AAT, GTA, CCG, CTA, CGC, CGT, CAG, GTT, TCC, CCG, GTG, AAA, GGG, GTT, TAT, GCG, GTA, GAA, GTG, TTG, GGC, CTT, GGC, GAA, AAG, CCG, TTA, CCC, GGC, GTT, GCA, AAC, ATC, GGA, ACA, CGC, CCA, ACG, GTT, GCC, GGT, ATT, CGC, CAG, CAA, CTG, GAA, GTG, CAT, TTG, TTA, GAT, GTT, GCA, ATG, GAC, CTT, TAT, GGT, CGC, CAT, ATA, CAA, GTA, GTG, CTG, CGT, AAA, AAA, ATA, CGC, AAT, GAG, CAG, CGA, TTT, GCA, TCG, CTG, GAC, GAA, CTG, AAA, GCG, CAG, ATT, GCG, CGT, GAT, GAA, TTA, ACC, GCC, CGC, GAA, TTT, TTT, GGG, CTA, ACA, AAA, CCG, GCT, TAA]
Is Protein?: YES
Region Name: Isoleucyl-tRNA synthetase
Nucleotides: ATGAGTGACTATAAATCAACCCTGAATTTGCCGGAAACAGGGTTCCCGATGCGTGGCGATCTCGCCAAGCGCGAACCGGGAATGCTGGCGCGTTGGACTGATGATGATCTGTACGGCATCATCCGTGCGGCTAAAAAAGGCAAAAAAACCTTCATTCTGCATGATGGCCCTCCTTATGCGAATGGCAGCATTCATATTGGTCACTCGGTTAACAAGATTCTGAAAGACATTATCATTAAGTCCAAAGGGCTTTCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCATGGTCTGCCAATCGAACTGAAAGTAGAGCAAGAATACGGTAAGCCGGGGGAGAAATTCACCGCCGCTGAGTTCCGCGCCAAGTGCCGCGAATACGCTGCGACCCAGGTTGACGGTCAGCGCAAAGACTTTATCCGTCTGGGCGTGCTGGGCGACTGGTCGCACCCGTACCTGACCATGGACTTCAAAACTGAAGCCAACATCATCCGCGCGCTGGGCAAAATCATCGGCAACGGTCACCTGCACAAAGGCGCGAAGCCGGTGCACTGGTGCGTTGACTGCCGTTCTGCACTGGCAGAAGCGGAAGTTGAGTATTACGACAAAACTTCTCCGTCCATCGACGTCGCTTTCCAGGCGGTCGATCAGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATGTTAACGGCCCAATTTCGCTGGTTATCTGGACCACCACGCCGTGGACGCTGCCTGCTAACCGCGCAATCTCCATTGCACCTGATTTTGATTATGCGCTGGTGCAAATCGACGGTCAGGCCGTGATCCTCGCGAAAGATCTGGTTGAAAGCGTAATGCAGCGTATCGGCGTTAGCGATTACACCATTCTTGGCACGGTGAAAGGTGCCGAGCTGGAACTGTTGCGCTTTACCCATCCGTTTATGGACTTCGATGTTCCGGCAATTCTCGGCGACCACGTTACGCTGGATGCCGGTACCGGTGCCGTTCATACCGCGCCAGGCCACGGTCCGGACGACTATGTGATCGGTCAAAAATATGGTCTGGAAACCGCTAACCCGGTTGGCCCGGACGGCACTTATCTGCCGGGTACTTACCCGACTCTGGATGGCGTTAACGTCTTCAAAGCGAACGATATTGTCATTGCGTTGTTGCAGGAAAAAGGCGCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTGCTGCTGGCGTCATAAAACGCCGATCATCTTCCGCGCGACGCCGCAGTGGTTCGTCAGCATGGATCAGAAAGGTCTGCGTGCGCAGTCACTGAAAGAGATCAAAGGCGTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATCTCTCGTCAGCGTACCTGGGGCGTGCCGATGTCACTGTTCGTGCACAAAGACACAGAAGAACTGCATCCGCGTACTCTCGAACTGATGGAAGAAGTGGCAAAACGCGTTGAAGTTGACGGCATTCAGGCGTGGTGGGATCTCGATGCGAAAGAGATCCTCGGCGACGAAGCTGACCAGTATGTGAAAGTACCGGATACGCTGGATGTATGGTTTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTCCGGAATTTGCCGGTCACGCAGCGGACATGTATCTGGAAGGTTCTGACCAACACCGTGGCTGGTTCATGTCTTCCCTGATGATCTCTACCGCGATGAAGGGCAAAGCGCCATATCGTCAGGTACTGACTCACGGCTTTACCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGTAACACCGTTTCGCCGCAGGATGTGATGAATAAACTGGGTGCGGATATTCTGCGTCTGTGGGTGGCATCAACCGACTACACTGGCGAAATGGCCGTTTCTGACGAGATCCTGAAACGTGCTGCCGACAGCTATCGTCGTATCCGTAACACCGCGCGCTTCCTGC
TGGCAAACCTGAACGGTTTTGATCCGGCAAAAGATATGGTGAAACCGGAAGAGATGGTGGTACTGGATCGCTGGGCCGTAGGTTGTGCGAAAGCGGCACAGGAAGACATCCTCAAGGCGTACGAAGCATACGATTTCCACGAAGTGGTACAGCGTCTGATGCGCTTCTGCTCCGTTGAGATGGGTTCCTTCTACCTCGACATCATCAAAGACCGTCAGTATACCGCCAAAGCGGACAGCGTGGCGCGTCGTAGCTGCCAGACTGCGCTGTATCACATCGCAGAAGCGCTGGTTCGCTGGATGGCACCAATCCTCTCCTTCACCGCTGATGAAGTGTGGGGTTACCTGCCGGGCGAACGTGAAAAATACGTCTTCACCGGCGAGTGGTACGAAGGCCTGTTTGGTCTGGCAGACAGTGAAGCAATGAACGATGCGTTCTGGGACGAGCTGTTGAAAGTGCGTGGCGAAGTGAACAAAGTCATTGAGCAAGCGCGTGCCGATAAGAACGTGGGCGGCTCGCTGGAAGCGGCAGTAACCTTGTATGCAGAACCGGAACTGGCGGCGAAACTGACCGCGCTGGGCGATGAATTACGATTTGTCCTGTTGACCTCCGGCGCTACCGTTGCAGACTATAACGACGCACCTGCTGATGCCCAGCAGAGCGAAGTCCTCAAAGGGCTGAAAGTCGCGTTGAGTAAAGCCGAAGGTGAGAAGTGTCCTCGCTGCTGGCACTACACCCAGGATGTCGGCAAGGTGGCGGAACACGCAGAAATCTGCGGCCGCTGTGTCAGCAACGTCGCCGGTGACGGTGAAAAACGTAAGTTTGCCTGA
Nuc. Counts: [660, 720, 817, 620]
Total Mass%: [24.0, 21.53, 33.23, 20.87] of 371617.0
Codons List: [ATG, AGT, GAC, TAT, AAA, TCA, ACC, CTG, AAT, TTG, CCG, GAA, ACA, GGG, TTC, CCG, ATG, CGT, GGC, GAT, CTC, GCC, AAG, CGC, GAA, CCG, GGA, ATG, CTG, GCG, CGT, TGG, ACT, GAT, GAT, GAT, CTG, TAC, GGC, ATC, ATC, CGT, GCG, GCT, AAA, AAA, GGC, AAA, AAA, ACC, TTC, ATT, CTG, CAT, GAT, GGC, CCT, CCT, TAT, GCG, AAT, GGC, AGC, ATT, CAT, ATT, GGT, CAC, TCG, GTT, AAC, AAG, ATT, CTG, AAA, GAC, ATT, ATC, ATT, AAG, TCC, AAA, GGG, CTT, TCT, GGA, TAT, GAC, TCG, CCG, TAT, GTG, CCT, GGC, TGG, GAC, TGT, CAT, GGT, CTG, CCA, ATC, GAA, CTG, AAA, GTA, GAG, CAA, GAA, TAC, GGT, AAG, CCG, GGG, GAG, AAA, TTC, ACC, GCC, GCT, GAG, TTC, CGC, GCC, AAG, TGC, CGC, GAA, TAC, GCT, GCG, ACC, CAG, GTT, GAC, GGT, CAG, CGC, AAA, GAC, TTT, ATC, CGT, CTG, GGC, GTG, CTG, GGC, GAC, TGG, TCG, CAC, CCG, TAC, CTG, ACC, ATG, GAC, TTC, AAA, ACT, GAA, GCC, AAC, ATC, ATC, CGC, GCG, CTG, GGC, AAA, ATC, ATC, GGC, AAC, GGT, CAC, CTG, CAC, AAA, GGC, GCG, AAG, CCG, GTG, CAC, TGG, TGC, GTT, GAC, TGC, CGT, TCT, GCA, CTG, GCA, GAA, GCG, GAA, GTT, GAG, TAT, TAC, GAC, AAA, ACT, TCT, CCG, TCC, ATC, GAC, GTC, GCT, TTC, CAG, GCG, GTC, GAT, CAG, GAT, GCG, CTG, AAA, ACG, AAA, TTT, GGC, GTA, AGC, AAT, GTT, AAC, GGC, CCA, ATT, TCG, CTG, GTT, ATC, TGG, ACC, ACC, ACG, CCG, TGG, ACG, CTG, CCT, GCT, AAC, CGC, GCA, ATC, TCC, ATT, GCA, CCT, GAT, TTT, GAT, TAT, GCG, CTG, GTG, CAA, ATC, GAC, GGT, CAG, GCC, GTG, ATC, CTC, GCG, AAA, GAT, CTG, GTT, GAA, AGC, GTA, ATG, CAG, CGT, ATC, GGC, GTT, AGC, GAT, TAC, ACC, ATT, CTT, GGC, ACG, GTG, AAA, GGT, GCC, GAG, CTG, GAA, CTG, TTG, CGC, TTT, ACC, CAT, CCG, TTT, ATG, GAC, TTC, GAT, GTT, CCG, GCA, ATT, CTC, GGC, GAC, CAC, GTT, ACG, CTG, GAT, GCC, GGT, ACC, GGT, GCC, GTT, CAT, ACC, GCG, CCA, GGC, CAC, GGT, CCG, GAC, GAC, TAT, GTG, ATC, GGT, CAA, AAA, TAT, GGT, CTG, GAA, ACC, GCT, AAC, CCG, GTT, GGC, CCG, GAC, GGC, ACT, TAT, CTG, CCG, GGT, ACT, TAC, CCG, ACT, CTG, GAT, GGC, GTT, AAC, GTC, TTC, AAA, GCG, AAC, GAT, ATT, GTC, ATT, GCG, TTG, TTG, CAG, GAA, AAA, GGC, GCA, CTG, TTG, CAC, GTT, GAG, 
AAA, ATG, CAA, CAC, AGC, TAT, CCG, TGC, TGC, TGG, CGT, CAT, AAA, ACG, CCG, ATC, ATC, TTC, CGC, GCG, ACG, CCG, CAG, TGG, TTC, GTC, AGC, ATG, GAT, CAG, AAA, GGT, CTG, CGT, GCG, CAG, TCA, CTG, AAA, GAG, ATC, AAA, GGC, GTG, CAG, TGG, ATC, CCT, GAC, TGG, GGC, CAG, GCG, CGT, ATC, GAG, TCG, ATG, GTT, GCT, AAC, CGT, CCT, GAC, TGG, TGT, ATC, TCT, CGT, CAG, CGT, ACC, TGG, GGC, GTG, CCG, ATG, TCA, CTG, TTC, GTG, CAC, AAA, GAC, ACA, GAA, GAA, CTG, CAT, CCG, CGT, ACT, CTC, GAA, CTG, ATG, GAA, GAA, GTG, GCA, AAA, CGC, GTT, GAA, GTT, GAC, GGC, ATT, CAG, GCG, TGG, TGG, GAT, CTC, GAT, GCG, AAA, GAG, ATC, CTC, GGC, GAC, GAA, GCT, GAC, CAG, TAT, GTG, AAA, GTA, CCG, GAT, ACG, CTG, GAT, GTA, TGG, TTT, GAC, TCC, GGA, TCT, ACC, CAC, TCT, TCC, GTT, GTT, GAT, GTG, CGT, CCG, GAA, TTT, GCC, GGT, CAC, GCA, GCG, GAC, ATG, TAT, CTG, GAA, GGT, TCT, GAC, CAA, CAC, CGT, GGC, TGG, TTC, ATG, TCT, TCC, CTG, ATG, ATC, TCT, ACC, GCG, ATG, AAG, GGC, AAA, GCG, CCA, TAT, CGT, CAG, GTA, CTG, ACT, CAC, GGC, TTT, ACC, GTG, GAT, GGT, CAG, GGT, CGC, AAG, ATG, TCT, AAA, TCC, ATC, GGT, AAC, ACC, GTT, TCG, CCG, CAG, GAT, GTG, ATG, AAT, AAA, CTG, GGT, GCG, GAT, ATT, CTG, CGT, CTG, TGG, GTG, GCA, TCA, ACC, GAC, TAC, ACT, GGC, GAA, ATG, GCC, GTT, TCT, GAC, GAG, ATC, CTG, AAA, CGT, GCT, GCC, GAC, AGC, TAT, CGT, CGT, ATC, CGT, AAC, ACC, GCG, CGC, TTC, CTG, CTG, GCA, AAC, CTG, AAC, GGT, TTT, GAT, CCG, GCA, AAA, GAT, ATG, GTG, AAA, CCG, GAA, GAG, ATG, GTG, GTA, CTG, GAT, CGC, TGG, GCC, GTA, GGT, TGT, GCG, AAA, GCG, GCA, CAG, GAA, GAC, ATC, CTC, AAG, GCG, TAC, GAA, GCA, TAC, GAT, TTC, CAC, GAA, GTG, GTA, CAG, CGT, CTG, ATG, CGC, TTC, TGC, TCC, GTT, GAG, ATG, GGT, TCC, TTC, TAC, CTC, GAC, ATC, ATC, AAA, GAC, CGT, CAG, TAT, ACC, GCC, AAA, GCG, GAC, AGC, GTG, GCG, CGT, CGT, AGC, TGC, CAG, ACT, GCG, CTG, TAT, CAC, ATC, GCA, GAA, GCG, CTG, GTT, CGC, TGG, ATG, GCA, CCA, ATC, CTC, TCC, TTC, ACC, GCT, GAT, GAA, GTG, TGG, GGT, TAC, CTG, CCG, GGC, GAA, CGT, GAA, AAA, TAC, GTC, TTC, ACC, GGC, GAG, TGG, TAC, GAA, GGC, CTG, TTT, GGT, 
CTG, GCA, GAC, AGT, GAA, GCA, ATG, AAC, GAT, GCG, TTC, TGG, GAC, GAG, CTG, TTG, AAA, GTG, CGT, GGC, GAA, GTG, AAC, AAA, GTC, ATT, GAG, CAA, GCG, CGT, GCC, GAT, AAG, AAC, GTG, GGC, GGC, TCG, CTG, GAA, GCG, GCA, GTA, ACC, TTG, TAT, GCA, GAA, CCG, GAA, CTG, GCG, GCG, AAA, CTG, ACC, GCG, CTG, GGC, GAT, GAA, TTA, CGA, TTT, GTC, CTG, TTG, ACC, TCC, GGC, GCT, ACC, GTT, GCA, GAC, TAT, AAC, GAC, GCA, CCT, GCT, GAT, GCC, CAG, CAG, AGC, GAA, GTC, CTC, AAA, GGG, CTG, AAA, GTC, GCG, TTG, AGT, AAA, GCC, GAA, GGT, GAG, AAG, TGT, CCT, CGC, TGC, TGG, CAC, TAC, ACC, CAG, GAT, GTC, GGC, AAG, GTG, GCG, GAA, CAC, GCA, GAA, ATC, TGC, GGC, CGC, TGT, GTC, AGC, AAC, GTC, GCC, GGT, GAC, GGT, GAA, AAA, CGT, AAG, TTT, GCC, TGA]
Is Protein?: YES
Region Name: Non-protein region
Nucleotides: GCTTGCGCCAACGCCATTTCATCGCCATCCCGCCGAGCATACAGGCCTCGGAAGAACCAATGGTGTTGGTGCCAACGGCCTGACCATTTTTCGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGCAGATTGCGGATATTCTTCTTTGTCGATCCAGTTTTTGTTAATGGATAAATCCA
Nuc. Counts: [46, 56, 49, 53]
Total Mass%: [23.44, 23.46, 27.93, 25.01] of 26515.7
Codons List: [GCT, TGC, GCC, AAC, GCC, ATT, TCA, TCG, CCA, TCC, CGC, CGA, GCA, TAC, AGG, CCT, CGG, AAG, AAC, CAA, TGG, TGT, TGG, TGC, CAA, CGG, CCT, GAC, CAT, TTT, TCG, GTG, CAG, GCG, CAT, GCC, ACA, GAT, CGG, CAA, CCA, TGT, TTA, CGC, AAC, GCA, GAT, CGA, TTG, CTG, CAG, ATT, GCG, GAT, ATT, CTT, CTT, TGT, CGA, TCC, AGT, TTT, TGT, TAA, TGG, ATA, AAT, CCA]
Is Protein?: NO
Region Name: FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase
Nucleotides: ATGTCTGAATCTGTACAGAGCAATAGCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGATGGCACCACCGCTGAGTCTACCCGCAACAACGGTAAACCGGCGCTGTTCCGCCTGGGTGATGCTTCTCTTTCTGAAGGGCTGGAGCAACACCTGCTGGGGCTGAAAGTGGGCGATAAAACCACCTTCTCGCTGGAGCCAGATGCGGCGTTTGGCGTGCCGTCACCGGACCTGATTCAGTACTTCTCCCGCCGTGAATTTATGGATGCAGGCGAGCCAGAAATTGGCGCAATCATGCTTTTTACCGCAATGGATGGCAGTGAGATGCCTGGCGTGATCCGCGAAATTAACGGCGACTCCATTACCGTTGATTTCAACCATCCGCTGGCCGGGCAGACCGTTCATTTTGATATTGAAGTGCTGGAAATCGATCCGGCACTGGAGGCGTAA
Nuc. Counts: [100, 121, 125, 104]
Total Mass%: [22.87, 22.75, 31.97, 22.02] of 59096.4
Codons List: [ATG, TCT, GAA, TCT, GTA, CAG, AGC, AAT, AGC, GCC, GTC, CTG, GTG, CAC, TTC, ACG, CTA, AAA, CTC, GAC, GAT, GGC, ACC, ACC, GCT, GAG, TCT, ACC, CGC, AAC, AAC, GGT, AAA, CCG, GCG, CTG, TTC, CGC, CTG, GGT, GAT, GCT, TCT, CTT, TCT, GAA, GGG, CTG, GAG, CAA, CAC, CTG, CTG, GGG, CTG, AAA, GTG, GGC, GAT, AAA, ACC, ACC, TTC, TCG, CTG, GAG, CCA, GAT, GCG, GCG, TTT, GGC, GTG, CCG, TCA, CCG, GAC, CTG, ATT, CAG, TAC, TTC, TCC, CGC, CGT, GAA, TTT, ATG, GAT, GCA, GGC, GAG, CCA, GAA, ATT, GGC, GCA, ATC, ATG, CTT, TTT, ACC, GCA, ATG, GAT, GGC, AGT, GAG, ATG, CCT, GGC, GTG, ATC, CGC, GAA, ATT, AAC, GGC, GAC, TCC, ATT, ACC, GTT, GAT, TTC, AAC, CAT, CCG, CTG, GCC, GGG, CAG, ACC, GTT, CAT, TTT, GAT, ATT, GAA, GTG, CTG, GAA, ATC, GAT, CCG, GCA, CTG, GAG, GCG, TAA]
Is Protein?: YES

18
dna/spec/dna.txt Normal file
View File

@ -0,0 +1,18 @@
cure for cancer protein
ATGCCACTATGGTAG
captain picard hair growth protein
ATgCCAACATGgATGCCcGATAtGGATTgA
bogus protein
CCATtAATgATCaCAGTt
michael jordan mad hops protein
ATgAGATCCgtgatGTGggaTCCTaCTCATTaa
paris hilton phony protein
AtgCCaacaTGGATGCCCTAAGATAtgGATTagtgA
george w bush approval rating protein
atgataattagttttaatatcagactgtaa
jimi hendrix guitar talent protein
ATGCAATTGCTCGATTAG
tyler durden's brain protein
ATGATAcctatgagtaaTGTGGACCatatccaaACTATAGGCATtgtcggACCAACGATcgattggtTATACTGA
mini me growth hormone
AtGgGaCGCTgA

5
dna/spec/dna_console.txt Normal file
View File

@ -0,0 +1,5 @@
This program reports information about DNA
nucleotide sequences that may encode proteins.
Input file name? dna.txt
Output file name? dna_file.txt

63
dna/spec/dna_file.txt Normal file
View File

@ -0,0 +1,63 @@
Region Name: cure for cancer protein
Nucleotides: ATGCCACTATGGTAG
Nuc. Counts: [4, 3, 4, 4]
Total Mass%: [27.3, 16.8, 30.6, 25.3] of 1978.8
Codons List: [ATG, CCA, CTA, TGG, TAG]
Is Protein?: YES
Region Name: captain picard hair growth protein
Nucleotides: ATGCCAACATGGATGCCCGATATGGATTGA
Nuc. Counts: [9, 6, 8, 7]
Total Mass%: [30.7, 16.8, 30.5, 22.1] of 3967.5
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, GAT, ATG, GAT, TGA]
Is Protein?: YES
Region Name: bogus protein
Nucleotides: CCATTAATGATCACAGTT
Nuc. Counts: [6, 4, 2, 6]
Total Mass%: [35.1, 19.3, 13.1, 32.5] of 2308.1
Codons List: [CCA, TTA, ATG, ATC, ACA, GTT]
Is Protein?: NO
Region Name: michael jordan mad hops protein
Nucleotides: ATGAGATCCGTGATGTGGGATCCTACTCATTAA
Nuc. Counts: [9, 6, 8, 10]
Total Mass%: [28.0, 15.3, 27.8, 28.8] of 4342.9
Codons List: [ATG, AGA, TCC, GTG, ATG, TGG, GAT, CCT, ACT, CAT, TAA]
Is Protein?: YES
Region Name: paris hilton phony protein
Nucleotides: ATGCCAACATGGATGCCCTAAGATATGGATTAGTGA
Nuc. Counts: [12, 6, 9, 9]
Total Mass%: [34.0, 14.0, 28.5, 23.6] of 4774.3
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, TAA, GAT, ATG, GAT, TAG, TGA]
Is Protein?: YES
Region Name: george w bush approval rating protein
Nucleotides: ATGATAATTAGTTTTAATATCAGACTGTAA
Nuc. Counts: [12, 2, 4, 12]
Total Mass%: [41.1, 5.6, 15.3, 38.0] of 3949.5
Codons List: [ATG, ATA, ATT, AGT, TTT, AAT, ATC, AGA, CTG, TAA]
Is Protein?: NO
Region Name: jimi hendrix guitar talent protein
Nucleotides: ATGCAATTGCTCGATTAG
Nuc. Counts: [5, 3, 4, 6]
Total Mass%: [28.6, 14.1, 25.6, 31.8] of 2364.1
Codons List: [ATG, CAA, TTG, CTC, GAT, TAG]
Is Protein?: YES
Region Name: tyler durden's brain protein
Nucleotides: ATGATACCTATGAGTAATGTGGACCATATCCAAACTATAGGCATTGTCGGACCAACGATCGATTGGTTATACTGA
Nuc. Counts: [24, 14, 16, 21]
Total Mass%: [32.9, 15.8, 24.6, 26.7] of 9843.8
Codons List: [ATG, ATA, CCT, ATG, AGT, AAT, GTG, GAC, CAT, ATC, CAA, ACT, ATA, GGC, ATT, GTC, GGA, CCA, ACG, ATC, GAT, TGG, TTA, TAC, TGA]
Is Protein?: YES
Region Name: mini me growth hormone
Nucleotides: ATGGGACGCTGA
Nuc. Counts: [3, 2, 5, 2]
Total Mass%: [24.8, 13.6, 46.3, 15.3] of 1633.4
Codons List: [ATG, GGA, CGC, TGA]
Is Protein?: NO

40
dna/spec/ecoli.txt Normal file
View File

@ -0,0 +1,40 @@
thr operon leader peptide
ATGAAACGCATTAGCaCCAcCATtACCACCaCCATCaCcATTACCACAGGTAACGGTGCGGGCTGA
aspartokinase I/homoserine dehydrogenase I
ATGCGAGtGTTGAAGTTcgGCGGTaCATCAgTGGCAAATGCAGAACGTtTTCTGCGGgTTGCCGATAttCTGGAAAGcAATGCCAGGCAGGGGCAGgTGGcCACCGTCCTCtCTGcCCCCGCCAAAATCACCAACCATCtGGTaGCGATGATtGaaAAaACCATtAGCGGTCAGGAtGCtTTaCcCaATATCAGCGATGCCGAACGTATTTTTGCCGAACTtCTGACgGGACTCGCCGCcGCCCAGcCGGGATTTCCGCTGGCACAAtTgAAAAcTTTCGTCGACCAgGAATTTGCCCAAATAAAACATGTcCtGCATGGCatCAGTTTGTTGGGGCAGTGCCCGGaTAGCATcAACGCTGCGCTGATTTGcCGTGgCGAGAAAaTGTcGaTcgCCattaTGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGgTCGAAaAAcTGCTgGCAGTGGGTCATTAcCtCgAaTCTACCGTTGATaTtGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCgGCTGACCACATgGtGCTGATGGCTGGTTTCACTGcCggTAATGAAAAAGgCGaGCTGGtGGTtCTGGGAcGCAACGGTTCCGACTaCTCCGCTGCGGTgCTGGCGGCcTGTTTaCGCGCCGATTGTTGcGAgaTCTGGACGGATGTTGAcGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGgAaGCGATGGAGCTTTCTTACTTCGGCGCTAAAgTTCTTCaCCCcCGCACCATTACCCCCATcGCCCAGtTCCAGATcCCTtgCCtGATTAAAAATAcCGgAAAtCCCCAAGCACCAGgTACGCtCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATcTGAATaACATGGCAATgTTCAGcGTTTCCGgCCCGGGGAtGAAAGGgATggTTgGCATGGCGGCGCGcgTCTTTGCAGcGaTGTCACGCGCCCGTaTTtCCGTGGTgCtGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCaAAGCGACTGTGTGCGAGCTgAaCGGGCAaTGcAGGAAGAGtTCTACCTGGAaCTGaAAGAAGGCTTACTGGAGCcGTTGGCgGtGACGGAACGGCTGGCCATTATCTcGGTGgTAGGTGATGGTATGCGcACCTtaCGTGGGAtCTCGgCGAAATtCTtTGCCGCGCTgGCcCGCGCCAATATCAACATTGTCgCCATTGCtCaGGGaTCTTcTGAaCGCTCAAtCTCTGTcGTGGTcAaTAACGATgATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGgCGTCGGTGGCGTTGgcGGTGCGCTGCTGgAGCAACTGAAGCGTCAgCAAAGCTGGTTGAAGAATAAaCATATCGaCTTACGTGTCTGCGGTGTTGCTAACTCGAAGgCACtgCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGgAAGAACTGGCGCAAGCcAAAGAGCCGTTTAATCTCGgGCGcTtAATTCGCCTCGTGAAAGAATATCATCTGCtGAaCCCGGTCATTgTTGACTgTACTTCCAgCCAGGCTGTgGCAGaTCAATATgCCGACTtCCTgCGCGAAGGTTTCCAcGTTGTtACGCCGAaCAAAaAGGCCaACACCTCGTcgATGGaTTACTaCCATCAGTtGCGTTATGCGGCGGAAAAATCGCGGCGTAaATTCCTCtATGACACcaACGTtGGGGCTGGATTACCGGTTATTgAGAACCTGCAAAATCTGCTCAATGCtGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTAtATCTTCGGCAAGTTAGACGAAGGCaTGAGTtTCTCCGAGgCGACCaCACTGGCGCGGGAAATGgGTTATACCGA
ACCGGAcCcGCGAGATGATCTTtCtGGTATGgAtGTGGCGCgTAagCTAtTGATtCTCGCTCGTGAAACGGGACGTGAACTGGAGCtGGCGGATATTGAAATTGAACCTgTGCTGCCCGCaGaGTTTAACGCCGAGGGTGATGTCGCcGCTTTTATGGCGAATCTGTCACAGCTCGACGaTCtCTTTGCCGCGCGTGTgGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATAttGATGAAGATgGCgTCTGCCGCGTGAAGaTTGCCGAAGTGGATGgTAATGaTCCGCTGTTCAAAGTGAaAaATGGCGaAAACGCCCTGGCCTTCTATAGCCACTATtATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCaATgACGTTaCAGCTGCCGGTgTCTTTGCTGATCTGCTACGtACCCTcTCAtGGaAGTTAGGAGTCTGA
homoserine kinase
ATgGTTAAAgTTTAtGCCCCGGCtTCCAGTGCCaATATGaGcGTCGgGTTTGATGTGCTCGGGgCGGCGGTGACACCTGTTGATGGTGCATTGCTCGgAGaTGTagTcaCGGTTGAGGCGGCAGAGACaTTCAgTCTCAACAACCTCGGACGCTTTGCCGAtAAGCTGCCGTCAGAGCCACGgGaaAATAtCGTTtATcAGTGcTGGGAGCGTtTTTGcCaGGAGCTTGGCAAGCAAATTCCAGTGGCGATGaCTCTGGAAAAGAATatGCCGAtCgGTTCGGGcTTAGGCTcCAGCGCCtGTTCAGTGGTCGCGGCgCTgAtGGCGATgAATGAAcACTGCGGCaAGCCGCTTAATGACACTCGTTTGCTGGCTTtGATGGgCGAgTTGGAAGGGcGTATCTCCGGCAGCAtTCATTACGACAACGtGGCACCGTGtTtTCtTGGTGGTAtGCAGTtgATGATCGAAGAaAACGACATCATCAGCCAGCAaGTGCCAGGGTTTGATGAGtGGCTGTGGGTGCTGGCGTATcCGGgGAtTAAAGTCtCGaCGGcAGAAGCCAGGGCTaTTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCAcGGGCgACATCTgGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATgAAAGaTGTTATCGCTGAACCCTACcGTGaACgGTTaCTGCCAGGCTTCCGGCAGGCGCGGcAGgCGGTTGCGGAAATCGGCGCGGTAgCGAGCGGTATCTCCGGCTCCGGCCCGAcTtTGTTCGCTCTGTGtGAcAAGCCGGATACCGCCCAGCGCGTTGCCGACTGgTTGGGTAAGAACtAcCTGCAAAATCAGgAAGGTTTTGTTcATATTTGCCGGCTGGATACGGCGGGcGCACGAgTACTGGAAAACTAA
threonine synthase
ATGAAACTCtacaATCTGAAAGATCACAATGAGCAGgTCaGCTTTGCGCAAGCCGTAACCCAGgGgTTAGGCAAAAATCAGGGgCtGTtTTTTCcgCACgaCCTGCCGGaaTTCAGCcTgACTGAAaTTGATGAGATgCTGAAGCtGGATTTTGTCACcCGCAGTGCGAAGATCCTcTCgGCGTTTATTGGTGATGAAATCCCGCAGGAAaTCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAaGCGATGTCGGTtGTCTGGAaTTGTTCcACGGGCcAACGCTGGCaTTTAAAGATTTCGGcGGTcGCTTTATGGCACAAATGCTgACCcATATTGCGGGCGATAAGCCAGTGAcCATTCTGACCGCGACATCCGGTgATACTGGaGCGGCAGTGGcTCATGcTTTCtACGGTtTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTgTTCTGTACATTGgGCggCAATATCGaAACTGTTGCCATCGAcggCGaTTTCGATGCCTGTCAGGCGCTGGTgAAGCAGGCgTTTGATGATGAAGAACTGAAAGTGgCgCtGGGGCtGAATTCTGCTAAcTCCATCAACaTCAGTCGCTTGCTGGCGcAGATTTGTTaTTAcTTTGaGGCTGTCGCACAGTtGCCGCAAGAAGCACGTAACCAGTTGgTTGTCTCGGTaCCGAGTGgAAACtTcGGCGATtTGACGGcGGGTCTGCTGGCGAaGTcACTCGGTCtGCCGGTAAAACGTtTTATTGCtgCGACCAACGTGAACGAtACCGTACCACGTTTCCTGCaCGaCGGTCAGTGGTCAcCCAAaGCGACTCAGgCGAcgTtaTCCAATGCGATGGATGTTAGCCAGCcAAaCAACTGGCCGCGTGTGGAAGAGTTGtTCcGCCGCAAAATCTGGCAACTGAAAGAGCTGGgTTATGCAGCCGTGgATGATGAAACCACGCAACAGACAATGcGTGAGtTAAaAGAACTGGGCTATACCTCGgAGCCGCACgCTGCCGTAGCTTATCGTGCGCTGCGTGACCAgTTGAAtCCAGGCGAATATGGCTTGTtCCTCGGcACcGCGCATCcGGcGAAatTtAAAgAGAGCGTGGAAGCGATTCTCGGTGAAAcGTTGGatCTGCCAAAAGAGCTGGCAGAACGTGCTgATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAatTgaTGATGAaTCATCAGTAA
hypothetical protein
AtGCAGCCcGGCTtTTTTTATGAAGAAAATaTGGAGaAaAACGACagGGAAAAAGGAGAAATTCtCAATAAATGCGGtAACTTAGAgATTaGGATTGCGGAGAATaACAACTGCcGTTCTCaTCGCGTAATCTCCGGATATCGACCCaTAACGGgCAATGATAAAAGgAGTAACCTGTGA
Non-protein region
aAAAACTgCTGGAAACAATGAAAGAcGTACCGGACGACCAAcGTCAGgCGC
transaldolase B
ATGACGGACAAATTGaCCTCcCTTCGTCAGTACACCACCGTAgTGGCCGACACTGGGGACATCGCGGCAATGAAGcTGTaTCAACcGCAGGATGCCACAACCAAcCCTtCTCTCATTCTTAACGCAGCGCAGATTCcGGAATACCGTAAgTTgATTGaTGATGCTGTCGCCTGGGcGAaACaGCAGAGCAAcGATcGCgCgCAGCAgATCGtGGACGCGACCGAcAAACTGGCAGTAaATATTgGTCTgGAAaTCCTGAAACTGgTTCCGgGCCgTATCTCAActGAAGTtGATGCGCGTCTTTCCTATGACaCCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGcAGGTaTTAGCAACGATCgTaTTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGcAGAACAGCTGGAAAAAGAaGGTATTAACTGTAAcCTGACCCTGCTgtTCTCctTCGCtCAGGcTCGTGCTTGTGCGGaAGCGGgCGTgTTCCTGaTCTCGcCGTTTgTTGGCcGTATTCTTGACTGGTAcAAaGCGAATACCGaTAAGAAAGAGtACGCTCcGGCAGAAGATcCGGGCGTGGTTTCTGTatCtGAAATCtACCAGtACTACaAAGAGCATGGTTaTgAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAAcTGGCAGGCTGCGACCGTCTGACCatCGCACCGgcACTGCTGAAAGAGCTGgCGGAGAGCGAAGGGGCTATCgAACGTAAACTgTCTTACAcTGgTGAAGTgAAAGCgCGTCCGGcGCGTATCACtGAGtCCGAGTTCCTgTGgCAgCACAACCAGGATCCAATGGCAGTaGATAAACTgGcGGaAGgTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCtGTAA
molybdopterin biosynthesis mog protein
ATGAATACTTTACGTATTGGCTTaGTtTcCaTCTCTGATCGCGCATCCAGCGGCGTTTAtCAGgaTAAAgGCATCCCTGCGCTGGAagAATGGCTGACAtcGGCGCTAACCACGcCGTTTGAaCTGGAAAcCCgCTTaATCCCCGATGAGCAGGCGATCATCGAGCAaACgTTgTGTGAGCTGGTGGATGAAaTGAGtTGCCaTCTGGTGCTCACCACGGGCGGAAcTGGCCCTGCGCGTCGTGAcgTAACGCcCGATGcGACGCTGGCAGTAGCGGACCGCGAGATgCcAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACcaaCTGCGATCCTTTCGCGTCAGGTggGGGTgATTCGCAAACAGGCGCTGATCCTTAACTTaCcCGGTCAACCGAAGtCTATTAAAGAGACGCtGgAAGGTGtGAAGGACGCTGAGgGTAAcGTTGTGGTGCACGgTATTTTTGCCaGCGTaCcGTaCTGCATTCAGTTGCTGGAAGGGCCATACGTTGAaACGGCaCCgGaAGTGGTTGCAGCATTCAGaCCGAAGAGTGCAaGACGCGAAGtTAGCGAATAA
chaperone protein DnaK
aTGGGTAAAATAaTTGGTATCGACcTGGGTACtACCAaCTCTTGTGTagCGaTTAtGGATGGCACCACTCCtCGTGtACTGgAGAACGcCGAAGGCGATCGCACCAcGcCTTcTATCATTgCCTATACCCAGGAtGGTGAAACTCTGGTTgGTCAGCCGGCTAAACGTCAGGCAgtGACGAACCCgCAaAACAcCCTGTtTGCGATTAAACGCCtGATTGGCCGCCgCTTCCAGgACgAAGAAGTACAGCGtGATgTTTcCATCATGCCGTTCAAAATTAtTGcTGCtgatAACGGCGACGcATGGGTCGAAGtTAAAgGCCAGAAAATGGCAcCGCCGcAGAtCTCTGCTGAAGTGCTGAAAAAAAtGAAGAAAACCGCTGAAGaTTAcCTGGgTGAAcCGGTAACTGaAGCTgtTATTACCGTACCGGCAtACTttaACGATGCTCAGCGTCAGGcAACCAAAGaCGCAGGCCGTATCGCTGGTCTGGAAGTAAAaCGTATCATCAACGAaCCGACCGCAGCTGCGCTGGCTtACGGtCTGGACAAAGgTACTGGCAACCgtACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTcCATTATCGAaATCGACGAAGTTGACGGCgAAAAAACCttCGAAGTTCTGGCAACCAACGGTGATACCCACCTGgGTGGtgAAGACTTCGACAGTCGTCTGATCAACTAtCTGGTTGAaGAATTCAAgAAAGATCAGGGCATTGacCtGCGCAACGaTcCGCTGGCAATGCAGCGCCTGAAaGAAGCGGCAGAAAAAGCgAAAATCGAACTGTctTCCGCTCAGcAGACCGaCGTTAACcTGCCGTACATCACTGCAGACGCGAcCGGTCCGAAACACAtGAACATCaAAgTGactCGTGCGAAACTGGAAAGCCTgGtTGAAGAtCTGGTAAACCGtTcCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATAtCGACgaCGTTATTCTCGTTGGTGGTCAGACTCGTATGCcAATGGtTCAGAAGAAAGTTGCTGaATTCTTTGGTAAAgAGCcGCGTAAAGATGTTAACCCGGACGAAGCTGTaGCCATCGgTGCTGCTGTTCAGGGTGGTGTTCTGACTGGtGAcGTAAAAGaCGTacTGCTgCtGGACGTTACCCCGCTGTCtCTGGGTATcGaAACCaTGGGCGGTGTGATGACCACGCTGATCGCgAaAAACACCACTATCCCGACCAaGcAcaGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATcCATgtGCTGcAGGGTGAACgTAaACGTGCgGCTGAtAAcaAATCTCTgggTCAGTTcAACCTGGATGGTATCAaCCCGGCACCGcGCGGCAtgCCGcAGATCGAAGtTACCtTCGAtATCGaTGCTGACGGTATCCTGCaCGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCAcTATCAaGGCTTCTTCTGGtCTGAaCGAAGAtGAAATCCAGAAAATGGTACGCGaCGCAGAAGCTAAcGCCGAAGCTGACCGTAaGTTTGAAGAGCTGGTACAGACtcGCaACCAGGGCGACCATCTGCTGCACAgCACCCGTAAGCAgGTTGAAGAAGCAGGCGACAaACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGActGCACTgGAAACtGCTCTGAAaGGTGAAGaCAAAGcCgCTATcGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCaGCAGCAACATGCcCAGCAGCAGACTGCCGGTGCTgATgCTTCtGCAAaCAAcGCGAAAGaTGACGATGTTGTCGACGCtGAATTTGAAGAAGTCAAAGACAAAAAATAA
chaperone protein DnaJ
GTGCatTCatCTAGGGGcAATTTAAAAAAGATGGCTAAGCAAGATTaTTACGAGaTTTTAGGCGTTTCCAAAaCAGCGGAAGAGCGtGAaaTCAAAAaGGCCTACAAACGCCTGGCCATGAAaTACCaCCCGGaCcGTAACCAGGgTGACAAAGaGGCCGAGGCGAAATTTAAAGAGATCAAGGaAGCTTATGAAGTTCTGACCGACtCGCAAAAACgTGCgGCATaCGATCAGTaTGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGcGGtTTTGGCGGCGGCgCAGACTTcAGCGATAtTTtTGGTGACGtTTTCGGCgATATTTTTGGcGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTAcGCTATAACATGGAGctCACcCtCGAAgAAGCTGTACGtgGCGtGaCCAAAGaGATccGCATtCCGACTCtGGAAGAGTGTGACGTTTGCCACgGTAGCgGTGCAAAACCaGGTACACAgCCgCAGACCTGTCCGACcTgTcATGGTTCTGGCCAGGtGCAGATGcGCCAGGGTTTCTTTGcCGTGCAGCAGACCTgTCcAcACTGTCAGGGCCGCGGTACGCTGaTcAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGtTGAGCgCaGCAAAACGCTGTCCGTTAAAATCCCGGCaGGGgTGGACACTGGAGaCCGCATCCGTCTTGCGgGCGAAGGTGAAGCGGGTGAACACGgCGCACCGGCAGGCGATCTgTACGTTCAGGTtCAGGTtAAACaGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGcGAAGTcCCGATCAAcTTCGCTATGgCGGCGcTGGGTGGTgaAATCGAAGTACcGACCcTTGATGGTcGcGTCaaACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAgCTGtTCCgTaTGCGCGGTAAAGGCGTCAAGTCtGTcCGCGGTGGcgCACAGGGTGATTtGCTATGCCGCGTTGTTGTCgaAACAcCGGTAGGTTTGAACgAGAAGCAGAAACAGCTGCTGCAAGaGctGCAAGAAAGCtTTGGTGGcCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCtTCTTtGATGGCGTGAaGAAGTTTTTTGACGaCCTgACTCGCTAA
hypothetical protein
TTGCTCTTaCTCGGATTCgTAAGCCGTGAAAACAGCAaCCTCCGtCTGGCCAGTTCGGATGTGAACCTCACAGAGgTCTTTTCTCGTTACCAgCGCCGCCACTACGGCGGTgATACAGATGACGATCAGgGcgACaAtcAtCgCcTTATGCTGCTTCATTGCTCtCTtCTCCTTGACCTTTCGGTCaGTAAGAgGCACTCTACATGTGTTCTGCATATAGgGGGCCTCGgGTtGATGgTAAAATAtCACTCGGGGCTTTTCTCTAtCTGCCGTTCAGCTAATgCcTGA
hypothetical protein
aTGTCTGCCAAaaGACGACTTCTTATTGCGtGTACCTTGAtAaCAGCTATcTATCAtTTTCCTGcaTATTCTTCATTAgAATATAAAGGAtCCTTTGGTTCAATaAATGCGGGTTAtGCAGACTGGAATAGTGGaTTTgTAAaCACTCACCGTGGTGAaGTATGGAAAGTGACtGCGGATTTTGGGgTaAATTTTAAAGAAGCAGAATTTTACTCAtTTTATgAaAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACgGtTTCAGCAATGaCGCATGTCAGACTCtTTGaCtCTGATaTGACATTCTTTGGCAAAATTTaTGgCCAATGGGATAACTCATgGggTGAcGATCTgGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCgAgTGGgGCTTTTtTAAACCGTATATTGGATtGCATAATCAATCTGGTGACTACGTATCAGCTAAATaTgGTCAAACGAATgGTTgGAATGGtTATGTTGTTGGCTGGACAGCAgTATTAcCATTTAcGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGaAATAGAACTGGACAGGaACGATGCTTACACGgAgCAGcAATTTGGCcGGAACGGgTTaAaTGGCGGtTTAACTATTGcCTGGAAGTTCTATCCTCGCTGGAAAGCCAGtGTGACGTGGCGTTATTTcGATAAtAaGCTGGGCTACGATGGCTTTgGcgaTCAAATGATTTAtATGCTTGgTTATGATTTCtAA
putative secreted sulfatase
ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAAtGCTTTTAGtCCTGCCTTAGCCGCAGAGGCTaAACAACcTAATTTAGTCATtaTTATGGCGGaTGATtTAGGTtaTGGCGAtTTAGcAaCaTATGGTCATCAGATCGTTAAAACACctAATATCGACAGGCtTGCCCAgGAAGGGGTCaAATTtACTGAcTaCTATGCCCCCGCTCCTTtAaGTTCAccTtCACGCGCaGGGCTATTAACCGGCcGGATGCCATTtCGTAcTGGAATTCGCTCATGGATtCCttCAGGCAAAGATGTTGCCtTAGGGCGTAACGAAcTCACgATTGCTAaTCTACTCAaAgCGCAaGGGTACGACACggCAATGATGGGTAAGCTGCATCTGAATgCAGGcGGCGaTCGCACCGATCAgCCaCAAGCACaAgATATGGGcTTTGATTAcTCAcTGGTtAATACgGCGGGCTTTGTTACcGACGCCACGCTGGATAAcGCTAAAGAACGCCcGCGTTATGGCATGGTTtAccCGACAGGCtgGCtACGTAACGGGCAACCCACTcCACGaGCTGATAAAAtGAGCGGTGAGTATGTCaGTTCGGAAGTCGTCAACTGGCTGGATAACAAAaaGGACaGCAAGCCTTTCTTCCTCTATgTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAaaATACCTCGATaTGTaCTCACaATATATGAGCGCGTATCAGAAGCAGcATCCTGATTTAtTTTaTGGCGACTGGGcAgACAAACCCTgGCGTgGTGTGGGgGAATATTAtGCCAATATCAGCTATCtGGATGCAcAGGTTGGAAAAgTGCTGGaTAAAATCAAAGCTGTGGgtGaAGaaGaTAACACAATCGTTATTTTTACCAGTGatAACGGTCCgGTAaCGCGTGAAGCGCGCAAAGTGTATgAGCTGAATTTGGCAGGGGAaACGGaTGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGtGTTCCaGCCATTATTAAATaTGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGtCTgGACTGGATGCCTACtTTaGCgAaAATGATGAACTTCAAATTACCTACAGAcCGTAcTTTCGATGgTGAATCGCTGGTTCCTGtTcTTGAGCaAAAAGCATTGAAACGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATgATCCAAcCGATGAATGGGCGATCCGTGATGgTGACTGGAAgAtGATTATCGATCGcaATAATAAACcGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAaCaCTTaAtCTGATCGGTAAAAAAACAgATATTGAAAAACAGATGTATGGTaAGtTTtTAAAATATAAAACTGATATTGATaATGATtCTCTAATGAAAgCCAGAGGTGATAAACCAGAAGCGGTGACCTggGGCTAa
putative cytoplasmic protein
ATGTTTACcAacGTAAATGTTGATTGtTgCAAAACACCAGGAtGTAAaaACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCAcAGgGTaAaAATATTTtATGCCGTGAATGTgGTTaCTTGTtTCCAGtGATATCTGAACAGTCGCTTAAtATTTaTCGTAATATTGTGAAtcACTcCTGGAGAGGTTTGATTTGCCAATGTTCAACTtGCGGAGGcACGTCCCTCAAAAAATaTGgATATtCtGCAcAagGCCAgAGAAGAATgTATTGCcaTCAtTGTGaGAAAACaTTtATCACTCTGGAAcAtGTAATTACcACACCACGAGGAGCcCTGTTAGcATTGATGATTGAGCAAGGGGAGGCACTTGCGGaTATCAgAAAGTCATTACGTCTTAACAgCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGcAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGtACCCGCGCTTtTCGcgTCAAGTAtAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGcGGCAGGGTgGTTGcCaTCTCAACCAATTACTCCCCATCtGCCGTAGagCaaCATTATcAATACaCATCGAACtATGAAGAGcGTATGTCTCCAGGGACGCTGGCACAtCATGTCCAGCGCAAAGAGttACTTACTATGCGGCgGGATACCTTGTTTGATATTGATTACGGCcCGgCAGTTTTACATCAAAACGATCCGGGAATGtTGGTAaAaCCGGTTCTTCCGGCATaTCGTCATTTTgAACTGGTCAGAATACTGACCGATGAGCATtCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATaTTGGGCGGCTGcCTGATGGCTAATTTGCAGCaTATTCATCAaGGTCGCTGCCATATTTCcTTTGTCAAaGAGCGcGGTGTGGCACCCGCCACCATTGaTTTTCCACCGCGATtATTCcTTAGTgGtGGgGTACgAAATAATGTCTGGCGTGCaTTTTCTAACCGCAATTATTCAaTGGCTGTATGCAAtCTCaCTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATtGAACAGTGCGACGCgTTtTATCCACTTTGTGgaGAACCATCCTTTCCTTATaTCATTGAACCGAATgtCTCCTGCGaaTGTCgtTTCTACaTTAGATaTCCTCAAACaTCTGTGGAATAaAaAACTAGagCATGGAACAATTtAA
sodium/proton antiporter 1
GTGAAACATCTGcATCGATTCTTTAGCaGTGATGCCTCGGGAGgCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTgcAaCCAGTGGATGGTATCACGACTTTCTTGAGACGCcGGTTCAGcTcCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGaCGCTCTGaTgGCGGTATTTTTCCTGTtGGTTGGTcTGGaAGTTAAAcGCGAGcTGaTGCAaGGTTCGCTGGCCAGTCtGCgCCAGGCGGCatTTCCTGTTATTGCCGcAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTtTtAACTATGCCGATCCGaTTaCCCGCGAAGGcTGGGCAatCCCGGCGGCGACTGacATTGCCTTTGCACTTggTgTGTTGGCGCTgTTGGGAAGTCGTGTTCCGTTAGCGCtGAAGATCTTTTtGATGGCTCTGGCtATTATCGACGATCTTgGGGcCATCATtATCATCGCATTGTTCTACAcTAATGACTTATCGATGGCCTcTCTTGGCGTcGCgGCTGTAGCAATTGCGgtACTCGCGGTATTGAAtCTGTgTGGTGTAcGCCGCACGGGCGTtTATATTCTGGTTGGCGTGGTGCtGTGGaCAGCGGTGTTGAAATCGGGGGTTCACGCAACCcTGGCTGGCGtCATtGtCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGgCGCTCTCcGgCTAAACGTCTGGAGCATGTTTTGCAtCCATGGGTGGCGTATCTGATtTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAaGGTgTCACGCtggAaGGTTTgACCtCCATTCTGCCATTAGgGATCATCGCTGGTTTGCTGaTTGGCaAGCCACtGGGTAtTaGTCTgttcTGCTGGtTGGcgCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACgACTtACCAGCAAATTATGGCGGtTGGTaTCcTGTGCGgTATCgGTTtTAcTatGTCTATCTTTATTGCCAGCCTGGcATTTGGTAgCGTAGATcCAGAaCTGaTTAACtGGGCAAAAtTAgGTATCCTTGTCGGTTCAATTTCtTcGgCGGTAATTGGATATAGcTGGTTACGcGTTCGTTTACGTCcATcAGTTTGA
transcriptional activator protein NhaR
ATGAGCATGTCTCATaTCAATTACAACCACTtGTATTACTTCTGGCaTGTCTAcAAAgAaGGTTCTGtGGTTGGCgCAGCGGAGGCGCTTTATTTAACAcCAcAAACCATTACCGGGCaGATCCGGGCGCTGGAaGAGCGCCTGCAAGGGAAAcTATTTAAGCGTAAAGGAcgTGGTCTGGAACCCAgcGAACTGGGGGAACTGGTCTATCGCtATGCCGATAAAATGTTCAcCTTAAgCCAGGAAATGCTgGATATCGTCAACTATCGCAAAGAGTCCAACTtATTGtTTGATGTTgGTGTGGCAGATGCACTTtcCAAAcGtcTGGTCAGCAGTGTTCtgGATgCCGCAGTtgTGGAAGACGAGCAGAtCCATCTACGCTGTTTCGAaTCGACGCACGAGATgCTTTTaGAGCAgtTGAGTCAGCATAaACTGGATATGATcaTCTCTGACTGTCCGaTCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAaTtGGCGAATGTGGTGTCAgtTTCTGGTgCACTAACCCACTACcAGAAAAGCCGTTTCCTGCCtGTCTTGAAgAGCgTCGtTtACTTATTCCGGGGCGTCGCTCAaTgTTGGGGCGtAAACTATTAAACTGGTTTAACTCcCAGGGCTTGAACGTCGAAATTTTGgGTGAGTTTGATGATGCTGCGTTGATGAAAgCCTTTGGGGCGAcGCATAACGcTATTTTCGTTGCACCTTCGCtTTACGCTAATgATTTCTATAACgATGACTCGgTtGTGgAGATAGgCCGTGTTGAGaACGTGATGGAAGAGTACCACGCGATTTtTGCCGaAAGgaTGAtTCAgCACCCTGcAGTAcAGCGTATCTGcAATACAgacTATTCTGCGCtgTTTACTCCAGCTTcAAAATAA
riboflavin kinase
ATGAAGCTGATACGCGgCAtACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTaATTTCGACGGCGTGCATCGCggTCATCGCGCGCTGTTACAGGGCtTGCAGGAAGAAGGGCGCAAGCGCAACtTACCGGTGATGGTGATGCTTTTtGaACCTCAACCAcTGGAACTGTTTGCTACTGAtAAAGCcCCGGCACGGcTcACcCGGCTGCgGGAAAAACTGCgTtaTcTTgCAGAgTGTGGCGTTGATTACGTGCTGTGCGtGCGTtTTGaCaGGCGTtTTGCGGCGTTAACCGCGcAAAACTTCATCAgTGATCTtCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGAtTTCCGCTTTggCGCTGgTCGTGAAgGCGAtTTCTtGTTATTACAGAaAGcgGGCATGGAATACGGCTTCGATATcACCAGCaCGCAAAcTTtTTGCGAAGGTGGTGTGCGtATCAGcAGCACCGCCGtgCGTCAGGCGCtTGCGgATgACAATCTGGCTCTGGCAGAAAGTTTACTGGgGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGaATTAGGGCGCAcTATAGGTTTCCCgACGGCGaATGTACCGcTaCgCCGTCAGGTTTCCCCGGTGAAAgGGGTTTATGCGGTAGaAgTgTTGGgCCtTGgCGAAaAGcCGTTAcCCGGcgTTGCAAACaTCGGAACACgCCCAACGGTTGCcGGTATTCGCCAGCAACTGgaAGTGCATTTGTTAGATGTTGcAATGGaCCTTTATGGTCGCCAtATACAAGTAGTGCTGCGtAAAAaAATAcGCAATGAGCAgCGATTTGcATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGcCCGCGaaTTTtTTGGGCTAAcAAAACCGGCTTAa
Isoleucyl-tRNA synthetase
ATGAGTGACTATAAATCaACCCTgAATTTGCCgGAAACAGgGTtCCCGATgCGTGGCGATCTCGcCAAGCGCGAAcCGGGaATGCTGGCGCGTTGGACTGATGATGATCTgTaCGGCATCATCCGTGCGGCTaAAAAAGGCAaAaAAACCTTCAtTCTGCATgATGGCCcTCCTTATGCGAATGGCAGCAtTCaTATTGGTcACTCGGTTAACAAGATTCTGAAAGACATTaTCATTaAgTCCAAAgGGCTttCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCaTGGtCTGCCAATCGAAcTGAAAGTAGAGCAAGAATACGGTAAGCCGGGgGAGaAaTTCACCGCCGcTGAGTtCCGCGCCAAGTGCCGCGAATACGCTGCgACCCAGGTTGACGGTCAGCGCAAAGACTTTaTCcGTCTGGGCGTGCTGGGCGActgGTCgcACCCGTACCTGACCATGGACtTCAAAACTGAAGCCAACATCATCCgCGCGCTGGGCAAAATCATCGGCAAcGGTCACCTGCACaAAGGcGCGAAGCCGGTgCACTGGTGCgTTGACTGCCGTTCTgCACTGGCAGAAGCGGAAGtTgAGTATTACGacAAAACTtCTCCGTCCATCGACGTCGCTTtCCAGGCGGTCGATCaGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATgTTAACGGCCCAATTTCGCtGGTTATCTGGaCcACCACGcCGTGgAcGCTGCcTGCTAacCGCgCAATCTCcATtGCACCTGATTTTGAttATGCGCTGGTGCaAatCgACGGTCAGgCCGTGATCCTCGCGAAAGATCtGGtTGaAAGCGTAAtGCAGCGTATCGGCGTTAGCGaTTACACCATTCTTGGCAcGGtgAAAGGTGCCGAGCtGGAACTGTTgCGCTTTACCCATCCGTTtATGGACtTCGATGTTCCGGCAaTTCTCGGCGACcACGTTACgCTGGATGCCGGTACCGGTGcCGTTCATACCGCGCCAGGCcACGGTCCGGaCGACTATgTGATCGGTcAAAAATaTGgTCTGGAAaCCGCTAACCCgGTTgGCcCGGACGgCACtTaTCTGCcGgGTACTTACCCGACTCtGGATgGCGTTaACGTCTTCAAAGCGAACGaTATTGTCATTGCGTTGTTgCAGGAAAAAGGcgCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTgCTGCtGGCGTCaTAAaACGCCGATCAtCTTCCGcgCGACGCCGCAGTGGTTCGTCAgCAtgGATCAGAAAGGTCTGCgTGCGcAGTCACTGAAAGAGATCAAAGGCgTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATcTCTCGTCaGCGTACCTGGGGcGTGCCgATGTCACTGTTCGTgCaCAaaGACACAGAAGAaCTGcATCCGCgTACTCtcGAACTGaTGGAAGAAGTGGcAAAACGCGTTgAAGTtGACgGCATTCAGGCgTGGTGGGATCTCGATGCGAAaGAgATCcTCGGCGaCGAAGCTGACCAGTATGTGAAAGTACCGGATACGCtGgATGTATGGTtTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTcCGGAATtTGCCGGTCACGCAGCGGACATGTaTcTGgAaGGTTCTGACCAACACcGTGgCTGGTtCATGTCtTCCCTGATGATCTCTACCGCGATGAAGGGcAAAGcGCCATATCGTCAGGTACTGACTCACGGCTTTAcCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGtAACaCcGTTTCGCCGCAGGATGTgATGAATAAACtGGGtGCGGATATTCTGCGTCTGTGGGTGGcATCAACCGACTAcACTGGCGAAATGGCcGtTTCTGACGAGATCcTGAAACGtGCTGCcGACAGCTATCGTCGTATCcGTAACAcCgCGCGCTTCCTGCTGGCAAACCTGAA
CgGTTtTGAtCCGGCaAAAGaTATGGTGAAACCGGAAGAGATGGTGGTaCTGGATCGCTGGGCCGtAGGTTGTGCGAAAGCGGCACAGGAAGACATCCtCAAGGCgTACGAAGCATACGATTTCcACGAAGTGGTaCAGCGTcTGaTGCGCtTCTGCTCCGTTGAGATGgGTTccTTCTACCTCGACATCATCAAAGACCGTCAgTATACcGCCAAAGCGGaCAGCGTGGCGCGTCGTAGCTGCCAGAcTgCGCTGTATCACATCGCaGAAGCGCTGGTTCGCTGGATGGCAcCAATCCTCTCCTTCaCcGCTGaTGAAGTGTGGGGtTaCCTGCCggGCGAACGTGAAAAATACGTCTTCAcCGGCgAgTGgTACGAAGGCCTGtTTGGTCTGGCAGACAGTGAAGCAATGAACGaTGCGTTCTGGGACGAGCTGTTGAAAGTGcGTGGCGAAGTGAAcAAAGTcaTTGAGCAAGCgCGTGCCGATAAGAACGTGGGcGGCTCGCTGGAAGCGGCAGTAAcCTTGTATGCAGAACCGGAaCTGGCgGCGAaaCTGaCCGcGCTGGGCGAtGAATTACGATTTGTCCTGtTGACCTCCGgCGCTAcCGTTGcAGACtATAACGACGCACCTGCTGATGCCCAGCAGaGCGAaGTcCTCAAAGGGCTGAAAgtCGCGTTGAGTAAAGCCgAAGGtGaGAAGTGTCCtcGctGCTGgCACTACACCcAGgATGTcGgCAAGGTGGCGGaACACGCAGAAATCTGCGGCCGCTGTgTcAgCaACGTCGCCGGTGACGGTGAAAAaCGTAAGTTTGCCTGA
Non-protein region
GCTTGCGCCAACGcCATTTCATCGCCATCCCGCCgAgcATACAGGCCTCGgAaGAACCAaTGGTGTTGGTGcCAACGGCCtGAccATTTTTcGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGcAGaTTGCGGATATTctTCTTTGTCGATCCAGTTTTTGTtAATGGAtAAAtCCA
FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase
ATGTCTGAATCTGTACAGaGCAaTAgCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGAtGGCaCCAcCGCTGAGTCTACCCGCAaCAaCGGTAaACCGGCGCTGTTCCGCcTGgGTgATGCTTCTCTTTCTgAaGgGCTGGAGCAACACCTGCTgGGGCTGAAAGTGGgCGATAAAACCaCCTTCtCGCTGGAGCCAGATGCGGCgTTtgGCGTGCCGTcACCgGAcCTGATtCAGTAcTTCTCcCGCCGTGAATTTATGgATGCAGGCGAGCcaGAAATTGGCGCAATCATgCTTTTTACCGCAATGGaTGGCAGTGAGATGCCTGGCGTGaTCCGCgAAATTAACGGCGACTCCATTACCGTTGATTTCAACCaTCCGCTgGCCGGGCAGACCGTTCATTTTGATATTGaagTGCTGGaAATCGATCCGGCAcTGGAGGcGTaA

View File

@ -0,0 +1,5 @@
This program reports information about DNA
nucleotide sequences that may encode proteins.
Input file name? ecoli.txt
Output file name? ecoli_file.txt

140
dna/spec/ecoli_file.txt Normal file
View File

@ -0,0 +1,140 @@
Region Name: thr operon leader peptide
Nucleotides: ATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGA
Nuc. Counts: [21, 22, 12, 11]
Total Mass%: [33.5, 28.9, 21.4, 16.2] of 8471.7
Codons List: [ATG, AAA, CGC, ATT, AGC, ACC, ACC, ATT, ACC, ACC, ACC, ATC, ACC, ATT, ACC, ACA, GGT, AAC, GGT, GCG, GGC, TGA]
Is Protein?: YES
Region Name: aspartokinase I/homoserine dehydrogenase I
Nucleotides: ATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGGGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCATCTGGTAGCGATGATTGAAAAAACCATTAGCGGTCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTCTGACGGGACTCGCCGCCGCCCAGCCGGGATTTCCGCTGGCACAATTGAAAACTTTCGTCGACCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATCAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCATTATGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGGTCGAAAAACTGCTGGCAGTGGGTCATTACCTCGAATCTACCGTTGATATTGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCGGCTGACCACATGGTGCTGATGGCTGGTTTCACTGCCGGTAATGAAAAAGGCGAGCTGGTGGTTCTGGGACGCAACGGTTCCGACTACTCCGCTGCGGTGCTGGCGGCCTGTTTACGCGCCGATTGTTGCGAGATCTGGACGGATGTTGACGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGGAAGCGATGGAGCTTTCTTACTTCGGCGCTAAAGTTCTTCACCCCCGCACCATTACCCCCATCGCCCAGTTCCAGATCCCTTGCCTGATTAAAAATACCGGAAATCCCCAAGCACCAGGTACGCTCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATCTGAATAACATGGCAATGTTCAGCGTTTCCGGCCCGGGGATGAAAGGGATGGTTGGCATGGCGGCGCGCGTCTTTGCAGCGATGTCACGCGCCCGTATTTCCGTGGTGCTGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCAAAGCGACTGTGTGCGAGCTGAACGGGCAATGCAGGAAGAGTTCTACCTGGAACTGAAAGAAGGCTTACTGGAGCCGTTGGCGGTGACGGAACGGCTGGCCATTATCTCGGTGGTAGGTGATGGTATGCGCACCTTACGTGGGATCTCGGCGAAATTCTTTGCCGCGCTGGCCCGCGCCAATATCAACATTGTCGCCATTGCTCAGGGATCTTCTGAACGCTCAATCTCTGTCGTGGTCAATAACGATGATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGGCGTCGGTGGCGTTGGCGGTGCGCTGCTGGAGCAACTGAAGCGTCAGCAAAGCTGGTTGAAGAATAAACATATCGACTTACGTGTCTGCGGTGTTGCTAACTCGAAGGCACTGCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGGAAGAACTGGCGCAAGCCAAAGAGCCGTTTAATCTCGGGCGCTTAATTCGCCTCGTGAAAGAATATCATCTGCTGAACCCGGTCATTGTTGACTGTACTTCCAGCCAGGCTGTGGCAGATCAATATGCCGACTTCCTGCGCGAAGGTTTCCACGTTGTTACGCCGAACAAAAAGGCCAACACCTCGTCGATGGATTACTACCATCAGTTGCGTTATGCGGCGGAAAAATCGCGGCGTAAATTCCTCTATGACACCAACGTTGGGGCTGGATTACCGGTTATTGAGAACCTGCAAAATCTGCTCAATGCTGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTATATCTTCGGCAAGTTAGACGAAGGCATGAGTTTCTCCGAGGCGACCACACTGGCGCGGGAAA
TGGGTTATACCGAACCGGACCCGCGAGATGATCTTTCTGGTATGGATGTGGCGCGTAAGCTATTGATTCTCGCTCGTGAAACGGGACGTGAACTGGAGCTGGCGGATATTGAAATTGAACCTGTGCTGCCCGCAGAGTTTAACGCCGAGGGTGATGTCGCCGCTTTTATGGCGAATCTGTCACAGCTCGACGATCTCTTTGCCGCGCGTGTGGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATATTGATGAAGATGGCGTCTGCCGCGTGAAGATTGCCGAAGTGGATGGTAATGATCCGCTGTTCAAAGTGAAAAATGGCGAAAACGCCCTGGCCTTCTATAGCCACTATTATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCAATGACGTTACAGCTGCCGGTGTCTTTGCTGATCTGCTACGTACCCTCTCATGGAAGTTAGGAGTCTGA
Nuc. Counts: [551, 608, 692, 612]
Total Mass%: [23.0, 20.9, 32.4, 23.7] of 323152.2
Codons List: [ATG, CGA, GTG, TTG, AAG, TTC, GGC, GGT, ACA, TCA, GTG, GCA, AAT, GCA, GAA, CGT, TTT, CTG, CGG, GTT, GCC, GAT, ATT, CTG, GAA, AGC, AAT, GCC, AGG, CAG, GGG, CAG, GTG, GCC, ACC, GTC, CTC, TCT, GCC, CCC, GCC, AAA, ATC, ACC, AAC, CAT, CTG, GTA, GCG, ATG, ATT, GAA, AAA, ACC, ATT, AGC, GGT, CAG, GAT, GCT, TTA, CCC, AAT, ATC, AGC, GAT, GCC, GAA, CGT, ATT, TTT, GCC, GAA, CTT, CTG, ACG, GGA, CTC, GCC, GCC, GCC, CAG, CCG, GGA, TTT, CCG, CTG, GCA, CAA, TTG, AAA, ACT, TTC, GTC, GAC, CAG, GAA, TTT, GCC, CAA, ATA, AAA, CAT, GTC, CTG, CAT, GGC, ATC, AGT, TTG, TTG, GGG, CAG, TGC, CCG, GAT, AGC, ATC, AAC, GCT, GCG, CTG, ATT, TGC, CGT, GGC, GAG, AAA, ATG, TCG, ATC, GCC, ATT, ATG, GCC, GGC, GTG, TTA, GAA, GCG, CGT, GGT, CAC, AAC, GTT, ACC, GTT, ATC, GAT, CCG, GTC, GAA, AAA, CTG, CTG, GCA, GTG, GGT, CAT, TAC, CTC, GAA, TCT, ACC, GTT, GAT, ATT, GCT, GAA, TCC, ACC, CGC, CGT, ATT, GCG, GCA, AGC, CGC, ATT, CCG, GCT, GAC, CAC, ATG, GTG, CTG, ATG, GCT, GGT, TTC, ACT, GCC, GGT, AAT, GAA, AAA, GGC, GAG, CTG, GTG, GTT, CTG, GGA, CGC, AAC, GGT, TCC, GAC, TAC, TCC, GCT, GCG, GTG, CTG, GCG, GCC, TGT, TTA, CGC, GCC, GAT, TGT, TGC, GAG, ATC, TGG, ACG, GAT, GTT, GAC, GGT, GTT, TAT, ACC, TGC, GAT, CCG, CGT, CAG, GTG, CCC, GAT, GCG, AGG, TTG, TTG, AAG, TCG, ATG, TCC, TAT, CAG, GAA, GCG, ATG, GAG, CTT, TCT, TAC, TTC, GGC, GCT, AAA, GTT, CTT, CAC, CCC, CGC, ACC, ATT, ACC, CCC, ATC, GCC, CAG, TTC, CAG, ATC, CCT, TGC, CTG, ATT, AAA, AAT, ACC, GGA, AAT, CCC, CAA, GCA, CCA, GGT, ACG, CTC, ATT, GGT, GCC, AGC, CGT, GAT, GAA, GAC, GAA, TTA, CCG, GTC, AAG, GGC, ATT, TCC, AAT, CTG, AAT, AAC, ATG, GCA, ATG, TTC, AGC, GTT, TCC, GGC, CCG, GGG, ATG, AAA, GGG, ATG, GTT, GGC, ATG, GCG, GCG, CGC, GTC, TTT, GCA, GCG, ATG, TCA, CGC, GCC, CGT, ATT, TCC, GTG, GTG, CTG, ATT, ACG, CAA, TCA, TCT, TCC, GAA, TAC, AGT, ATC, AGT, TTC, TGC, GTT, CCG, CAA, AGC, GAC, TGT, GTG, CGA, GCT, GAA, CGG, GCA, ATG, CAG, GAA, GAG, TTC, TAC, CTG, GAA, CTG, AAA, GAA, GGC, TTA, CTG, GAG, CCG, TTG, GCG, GTG, ACG, GAA, CGG, CTG, GCC, 
ATT, ATC, TCG, GTG, GTA, GGT, GAT, GGT, ATG, CGC, ACC, TTA, CGT, GGG, ATC, TCG, GCG, AAA, TTC, TTT, GCC, GCG, CTG, GCC, CGC, GCC, AAT, ATC, AAC, ATT, GTC, GCC, ATT, GCT, CAG, GGA, TCT, TCT, GAA, CGC, TCA, ATC, TCT, GTC, GTG, GTC, AAT, AAC, GAT, GAT, GCG, ACC, ACT, GGC, GTG, CGC, GTT, ACT, CAT, CAG, ATG, CTG, TTC, AAT, ACC, GAT, CAG, GTT, ATC, GAA, GTG, TTT, GTG, ATT, GGC, GTC, GGT, GGC, GTT, GGC, GGT, GCG, CTG, CTG, GAG, CAA, CTG, AAG, CGT, CAG, CAA, AGC, TGG, TTG, AAG, AAT, AAA, CAT, ATC, GAC, TTA, CGT, GTC, TGC, GGT, GTT, GCT, AAC, TCG, AAG, GCA, CTG, CTC, ACC, AAT, GTA, CAT, GGC, CTT, AAT, CTG, GAA, AAC, TGG, CAG, GAA, GAA, CTG, GCG, CAA, GCC, AAA, GAG, CCG, TTT, AAT, CTC, GGG, CGC, TTA, ATT, CGC, CTC, GTG, AAA, GAA, TAT, CAT, CTG, CTG, AAC, CCG, GTC, ATT, GTT, GAC, TGT, ACT, TCC, AGC, CAG, GCT, GTG, GCA, GAT, CAA, TAT, GCC, GAC, TTC, CTG, CGC, GAA, GGT, TTC, CAC, GTT, GTT, ACG, CCG, AAC, AAA, AAG, GCC, AAC, ACC, TCG, TCG, ATG, GAT, TAC, TAC, CAT, CAG, TTG, CGT, TAT, GCG, GCG, GAA, AAA, TCG, CGG, CGT, AAA, TTC, CTC, TAT, GAC, ACC, AAC, GTT, GGG, GCT, GGA, TTA, CCG, GTT, ATT, GAG, AAC, CTG, CAA, AAT, CTG, CTC, AAT, GCT, GGT, GAT, GAA, TTG, ATG, AAG, TTC, TCC, GGC, ATT, CTT, TCA, GGT, TCG, CTT, TCT, TAT, ATC, TTC, GGC, AAG, TTA, GAC, GAA, GGC, ATG, AGT, TTC, TCC, GAG, GCG, ACC, ACA, CTG, GCG, CGG, GAA, ATG, GGT, TAT, ACC, GAA, CCG, GAC, CCG, CGA, GAT, GAT, CTT, TCT, GGT, ATG, GAT, GTG, GCG, CGT, AAG, CTA, TTG, ATT, CTC, GCT, CGT, GAA, ACG, GGA, CGT, GAA, CTG, GAG, CTG, GCG, GAT, ATT, GAA, ATT, GAA, CCT, GTG, CTG, CCC, GCA, GAG, TTT, AAC, GCC, GAG, GGT, GAT, GTC, GCC, GCT, TTT, ATG, GCG, AAT, CTG, TCA, CAG, CTC, GAC, GAT, CTC, TTT, GCC, GCG, CGT, GTG, GCG, AAG, GCC, CGT, GAT, GAA, GGA, AAA, GTT, TTG, CGC, TAT, GTT, GGC, AAT, ATT, GAT, GAA, GAT, GGC, GTC, TGC, CGC, GTG, AAG, ATT, GCC, GAA, GTG, GAT, GGT, AAT, GAT, CCG, CTG, TTC, AAA, GTG, AAA, AAT, GGC, GAA, AAC, GCC, CTG, GCC, TTC, TAT, AGC, CAC, TAT, TAT, CAG, CCG, CTG, CCG, TTG, GTA, CTG, CGC, GGA, TAT, GGT, GCG, 
GGC, AAT, GAC, GTT, ACA, GCT, GCC, GGT, GTC, TTT, GCT, GAT, CTG, CTA, CGT, ACC, CTC, TCA, TGG, AAG, TTA, GGA, GTC, TGA]
Is Protein?: YES
Region Name: homoserine kinase
Nucleotides: ATGGTTAAAGTTTATGCCCCGGCTTCCAGTGCCAATATGAGCGTCGGGTTTGATGTGCTCGGGGCGGCGGTGACACCTGTTGATGGTGCATTGCTCGGAGATGTAGTCACGGTTGAGGCGGCAGAGACATTCAGTCTCAACAACCTCGGACGCTTTGCCGATAAGCTGCCGTCAGAGCCACGGGAAAATATCGTTTATCAGTGCTGGGAGCGTTTTTGCCAGGAGCTTGGCAAGCAAATTCCAGTGGCGATGACTCTGGAAAAGAATATGCCGATCGGTTCGGGCTTAGGCTCCAGCGCCTGTTCAGTGGTCGCGGCGCTGATGGCGATGAATGAACACTGCGGCAAGCCGCTTAATGACACTCGTTTGCTGGCTTTGATGGGCGAGTTGGAAGGGCGTATCTCCGGCAGCATTCATTACGACAACGTGGCACCGTGTTTTCTTGGTGGTATGCAGTTGATGATCGAAGAAAACGACATCATCAGCCAGCAAGTGCCAGGGTTTGATGAGTGGCTGTGGGTGCTGGCGTATCCGGGGATTAAAGTCTCGACGGCAGAAGCCAGGGCTATTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCACGGGCGACATCTGGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATGAAAGATGTTATCGCTGAACCCTACCGTGAACGGTTACTGCCAGGCTTCCGGCAGGCGCGGCAGGCGGTTGCGGAAATCGGCGCGGTAGCGAGCGGTATCTCCGGCTCCGGCCCGACTTTGTTCGCTCTGTGTGACAAGCCGGATACCGCCCAGCGCGTTGCCGACTGGTTGGGTAAGAACTACCTGCAAAATCAGGAAGGTTTTGTTCATATTTGCCGGCTGGATACGGCGGGCGCACGAGTACTGGAAAACTAA
Nuc. Counts: [193, 226, 295, 219]
Total Mass%: [21.2, 20.4, 36.2, 22.2] of 123170.2
Codons List: [ATG, GTT, AAA, GTT, TAT, GCC, CCG, GCT, TCC, AGT, GCC, AAT, ATG, AGC, GTC, GGG, TTT, GAT, GTG, CTC, GGG, GCG, GCG, GTG, ACA, CCT, GTT, GAT, GGT, GCA, TTG, CTC, GGA, GAT, GTA, GTC, ACG, GTT, GAG, GCG, GCA, GAG, ACA, TTC, AGT, CTC, AAC, AAC, CTC, GGA, CGC, TTT, GCC, GAT, AAG, CTG, CCG, TCA, GAG, CCA, CGG, GAA, AAT, ATC, GTT, TAT, CAG, TGC, TGG, GAG, CGT, TTT, TGC, CAG, GAG, CTT, GGC, AAG, CAA, ATT, CCA, GTG, GCG, ATG, ACT, CTG, GAA, AAG, AAT, ATG, CCG, ATC, GGT, TCG, GGC, TTA, GGC, TCC, AGC, GCC, TGT, TCA, GTG, GTC, GCG, GCG, CTG, ATG, GCG, ATG, AAT, GAA, CAC, TGC, GGC, AAG, CCG, CTT, AAT, GAC, ACT, CGT, TTG, CTG, GCT, TTG, ATG, GGC, GAG, TTG, GAA, GGG, CGT, ATC, TCC, GGC, AGC, ATT, CAT, TAC, GAC, AAC, GTG, GCA, CCG, TGT, TTT, CTT, GGT, GGT, ATG, CAG, TTG, ATG, ATC, GAA, GAA, AAC, GAC, ATC, ATC, AGC, CAG, CAA, GTG, CCA, GGG, TTT, GAT, GAG, TGG, CTG, TGG, GTG, CTG, GCG, TAT, CCG, GGG, ATT, AAA, GTC, TCG, ACG, GCA, GAA, GCC, AGG, GCT, ATT, TTA, CCG, GCG, CAG, TAT, CGC, CGC, CAG, GAT, TGC, ATT, GCG, CAC, GGG, CGA, CAT, CTG, GCA, GGC, TTC, ATT, CAC, GCC, TGC, TAT, TCC, CGT, CAG, CTT, GAG, CTT, GCC, GCG, AAG, CTG, ATG, AAA, GAT, GTT, ATC, GCT, GAA, CCC, TAC, CGT, GAA, CGG, TTA, CTG, CCA, GGC, TTC, CGG, CAG, GCG, CGG, CAG, GCG, GTT, GCG, GAA, ATC, GGC, GCG, GTA, GCG, AGC, GGT, ATC, TCC, GGC, TCC, GGC, CCG, ACT, TTG, TTC, GCT, CTG, TGT, GAC, AAG, CCG, GAT, ACC, GCC, CAG, CGC, GTT, GCC, GAC, TGG, TTG, GGT, AAG, AAC, TAC, CTG, CAA, AAT, CAG, GAA, GGT, TTT, GTT, CAT, ATT, TGC, CGG, CTG, GAT, ACG, GCG, GGC, GCA, CGA, GTA, CTG, GAA, AAC, TAA]
Is Protein?: YES
Region Name: threonine synthase
Nucleotides: ATGAAACTCTACAATCTGAAAGATCACAATGAGCAGGTCAGCTTTGCGCAAGCCGTAACCCAGGGGTTAGGCAAAAATCAGGGGCTGTTTTTTCCGCACGACCTGCCGGAATTCAGCCTGACTGAAATTGATGAGATGCTGAAGCTGGATTTTGTCACCCGCAGTGCGAAGATCCTCTCGGCGTTTATTGGTGATGAAATCCCGCAGGAAATCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAAGCGATGTCGGTTGTCTGGAATTGTTCCACGGGCCAACGCTGGCATTTAAAGATTTCGGCGGTCGCTTTATGGCACAAATGCTGACCCATATTGCGGGCGATAAGCCAGTGACCATTCTGACCGCGACATCCGGTGATACTGGAGCGGCAGTGGCTCATGCTTTCTACGGTTTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTGTTCTGTACATTGGGCGGCAATATCGAAACTGTTGCCATCGACGGCGATTTCGATGCCTGTCAGGCGCTGGTGAAGCAGGCGTTTGATGATGAAGAACTGAAAGTGGCGCTGGGGCTGAATTCTGCTAACTCCATCAACATCAGTCGCTTGCTGGCGCAGATTTGTTATTACTTTGAGGCTGTCGCACAGTTGCCGCAAGAAGCACGTAACCAGTTGGTTGTCTCGGTACCGAGTGGAAACTTCGGCGATTTGACGGCGGGTCTGCTGGCGAAGTCACTCGGTCTGCCGGTAAAACGTTTTATTGCTGCGACCAACGTGAACGATACCGTACCACGTTTCCTGCACGACGGTCAGTGGTCACCCAAAGCGACTCAGGCGACGTTATCCAATGCGATGGATGTTAGCCAGCCAAACAACTGGCCGCGTGTGGAAGAGTTGTTCCGCCGCAAAATCTGGCAACTGAAAGAGCTGGGTTATGCAGCCGTGGATGATGAAACCACGCAACAGACAATGCGTGAGTTAAAAGAACTGGGCTATACCTCGGAGCCGCACGCTGCCGTAGCTTATCGTGCGCTGCGTGACCAGTTGAATCCAGGCGAATATGGCTTGTTCCTCGGCACCGCGCATCCGGCGAAATTTAAAGAGAGCGTGGAAGCGATTCTCGGTGAAACGTTGGATCTGCCAAAAGAGCTGGCAGAACGTGCTGATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAATTGATGATGAATCATCAGTAA
Nuc. Counts: [309, 311, 358, 309]
Total Mass%: [24.7, 20.4, 32.0, 22.9] of 169069.5
Codons List: [ATG, AAA, CTC, TAC, AAT, CTG, AAA, GAT, CAC, AAT, GAG, CAG, GTC, AGC, TTT, GCG, CAA, GCC, GTA, ACC, CAG, GGG, TTA, GGC, AAA, AAT, CAG, GGG, CTG, TTT, TTT, CCG, CAC, GAC, CTG, CCG, GAA, TTC, AGC, CTG, ACT, GAA, ATT, GAT, GAG, ATG, CTG, AAG, CTG, GAT, TTT, GTC, ACC, CGC, AGT, GCG, AAG, ATC, CTC, TCG, GCG, TTT, ATT, GGT, GAT, GAA, ATC, CCG, CAG, GAA, ATC, CTG, GAA, GAG, CGC, GTA, CGT, GCG, GCG, TTT, GCC, TTC, CCG, GCT, CCG, GTC, GCC, AAT, GTT, GAA, AGC, GAT, GTC, GGT, TGT, CTG, GAA, TTG, TTC, CAC, GGG, CCA, ACG, CTG, GCA, TTT, AAA, GAT, TTC, GGC, GGT, CGC, TTT, ATG, GCA, CAA, ATG, CTG, ACC, CAT, ATT, GCG, GGC, GAT, AAG, CCA, GTG, ACC, ATT, CTG, ACC, GCG, ACA, TCC, GGT, GAT, ACT, GGA, GCG, GCA, GTG, GCT, CAT, GCT, TTC, TAC, GGT, TTA, CCG, AAT, GTG, AAA, GTG, GTT, ATC, CTC, TAT, CCA, CGA, GGC, AAA, ATC, AGT, CCA, CTG, CAA, GAA, AAA, CTG, TTC, TGT, ACA, TTG, GGC, GGC, AAT, ATC, GAA, ACT, GTT, GCC, ATC, GAC, GGC, GAT, TTC, GAT, GCC, TGT, CAG, GCG, CTG, GTG, AAG, CAG, GCG, TTT, GAT, GAT, GAA, GAA, CTG, AAA, GTG, GCG, CTG, GGG, CTG, AAT, TCT, GCT, AAC, TCC, ATC, AAC, ATC, AGT, CGC, TTG, CTG, GCG, CAG, ATT, TGT, TAT, TAC, TTT, GAG, GCT, GTC, GCA, CAG, TTG, CCG, CAA, GAA, GCA, CGT, AAC, CAG, TTG, GTT, GTC, TCG, GTA, CCG, AGT, GGA, AAC, TTC, GGC, GAT, TTG, ACG, GCG, GGT, CTG, CTG, GCG, AAG, TCA, CTC, GGT, CTG, CCG, GTA, AAA, CGT, TTT, ATT, GCT, GCG, ACC, AAC, GTG, AAC, GAT, ACC, GTA, CCA, CGT, TTC, CTG, CAC, GAC, GGT, CAG, TGG, TCA, CCC, AAA, GCG, ACT, CAG, GCG, ACG, TTA, TCC, AAT, GCG, ATG, GAT, GTT, AGC, CAG, CCA, AAC, AAC, TGG, CCG, CGT, GTG, GAA, GAG, TTG, TTC, CGC, CGC, AAA, ATC, TGG, CAA, CTG, AAA, GAG, CTG, GGT, TAT, GCA, GCC, GTG, GAT, GAT, GAA, ACC, ACG, CAA, CAG, ACA, ATG, CGT, GAG, TTA, AAA, GAA, CTG, GGC, TAT, ACC, TCG, GAG, CCG, CAC, GCT, GCC, GTA, GCT, TAT, CGT, GCG, CTG, CGT, GAC, CAG, TTG, AAT, CCA, GGC, GAA, TAT, GGC, TTG, TTC, CTC, GGC, ACC, GCG, CAT, CCG, GCG, AAA, TTT, AAA, GAG, AGC, GTG, GAA, GCG, ATT, CTC, GGT, GAA, ACG, TTG, GAT, CTG, CCA, 
AAA, GAG, CTG, GCA, GAA, CGT, GCT, GAT, TTA, CCC, TTG, CTT, TCG, CAT, AAC, CTG, CCC, GCC, GAT, TTT, GCT, GCG, TTG, CGT, AAA, TTG, ATG, ATG, AAT, CAT, CAG, TAA]
Is Protein?: YES
Region Name: hypothetical protein
Nucleotides: ATGCAGCCCGGCTTTTTTTATGAAGAAAATATGGAGAAAAACGACAGGGAAAAAGGAGAAATTCTCAATAAATGCGGTAACTTAGAGATTAGGATTGCGGAGAATAACAACTGCCGTTCTCATCGCGTAATCTCCGGATATCGACCCATAACGGGCAATGATAAAAGGAGTAACCTGTGA
Nuc. Counts: [66, 31, 43, 40]
Total Mass%: [37.4, 14.4, 27.2, 21.0] of 23865.4
Codons List: [ATG, CAG, CCC, GGC, TTT, TTT, TAT, GAA, GAA, AAT, ATG, GAG, AAA, AAC, GAC, AGG, GAA, AAA, GGA, GAA, ATT, CTC, AAT, AAA, TGC, GGT, AAC, TTA, GAG, ATT, AGG, ATT, GCG, GAG, AAT, AAC, AAC, TGC, CGT, TCT, CAT, CGC, GTA, ATC, TCC, GGA, TAT, CGA, CCC, ATA, ACG, GGC, AAT, GAT, AAA, AGG, AGT, AAC, CTG, TGA]
Is Protein?: YES
Region Name: Non-protein region
Nucleotides: AAAAACTGCTGGAAACAATGAAAGACGTACCGGACGACCAACGTCAGGCGC
Nuc. Counts: [20, 13, 13, 5]
Total Mass%: [40.1, 21.4, 29.2, 9.3] of 6737.1
Codons List: [AAA, AAC, TGC, TGG, AAA, CAA, TGA, AAG, ACG, TAC, CGG, ACG, ACC, AAC, GTC, AGG, CGC]
Is Protein?: NO
Region Name: transaldolase B
Nucleotides: ATGACGGACAAATTGACCTCCCTTCGTCAGTACACCACCGTAGTGGCCGACACTGGGGACATCGCGGCAATGAAGCTGTATCAACCGCAGGATGCCACAACCAACCCTTCTCTCATTCTTAACGCAGCGCAGATTCCGGAATACCGTAAGTTGATTGATGATGCTGTCGCCTGGGCGAAACAGCAGAGCAACGATCGCGCGCAGCAGATCGTGGACGCGACCGACAAACTGGCAGTAAATATTGGTCTGGAAATCCTGAAACTGGTTCCGGGCCGTATCTCAACTGAAGTTGATGCGCGTCTTTCCTATGACACCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGCAGGTATTAGCAACGATCGTATTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGCAGAACAGCTGGAAAAAGAAGGTATTAACTGTAACCTGACCCTGCTGTTCTCCTTCGCTCAGGCTCGTGCTTGTGCGGAAGCGGGCGTGTTCCTGATCTCGCCGTTTGTTGGCCGTATTCTTGACTGGTACAAAGCGAATACCGATAAGAAAGAGTACGCTCCGGCAGAAGATCCGGGCGTGGTTTCTGTATCTGAAATCTACCAGTACTACAAAGAGCATGGTTATGAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAACTGGCAGGCTGCGACCGTCTGACCATCGCACCGGCACTGCTGAAAGAGCTGGCGGAGAGCGAAGGGGCTATCGAACGTAAACTGTCTTACACTGGTGAAGTGAAAGCGCGTCCGGCGCGTATCACTGAGTCCGAGTTCCTGTGGCAGCACAACCAGGATCCAATGGCAGTAGATAAACTGGCGGAAGGTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCTGTAA
Nuc. Counts: [252, 236, 256, 210]
Total Mass%: [27.2, 20.9, 30.9, 21.0] of 125233.8
Codons List: [ATG, ACG, GAC, AAA, TTG, ACC, TCC, CTT, CGT, CAG, TAC, ACC, ACC, GTA, GTG, GCC, GAC, ACT, GGG, GAC, ATC, GCG, GCA, ATG, AAG, CTG, TAT, CAA, CCG, CAG, GAT, GCC, ACA, ACC, AAC, CCT, TCT, CTC, ATT, CTT, AAC, GCA, GCG, CAG, ATT, CCG, GAA, TAC, CGT, AAG, TTG, ATT, GAT, GAT, GCT, GTC, GCC, TGG, GCG, AAA, CAG, CAG, AGC, AAC, GAT, CGC, GCG, CAG, CAG, ATC, GTG, GAC, GCG, ACC, GAC, AAA, CTG, GCA, GTA, AAT, ATT, GGT, CTG, GAA, ATC, CTG, AAA, CTG, GTT, CCG, GGC, CGT, ATC, TCA, ACT, GAA, GTT, GAT, GCG, CGT, CTT, TCC, TAT, GAC, ACC, GAA, GCG, TCA, ATT, GCG, AAA, GCA, AAA, CGC, CTG, ATC, AAA, CTC, TAC, AAC, GAT, GCA, GGT, ATT, AGC, AAC, GAT, CGT, ATT, CTG, ATC, AAA, CTG, GCT, TCT, ACC, TGG, CAG, GGT, ATC, CGT, GCT, GCA, GAA, CAG, CTG, GAA, AAA, GAA, GGT, ATT, AAC, TGT, AAC, CTG, ACC, CTG, CTG, TTC, TCC, TTC, GCT, CAG, GCT, CGT, GCT, TGT, GCG, GAA, GCG, GGC, GTG, TTC, CTG, ATC, TCG, CCG, TTT, GTT, GGC, CGT, ATT, CTT, GAC, TGG, TAC, AAA, GCG, AAT, ACC, GAT, AAG, AAA, GAG, TAC, GCT, CCG, GCA, GAA, GAT, CCG, GGC, GTG, GTT, TCT, GTA, TCT, GAA, ATC, TAC, CAG, TAC, TAC, AAA, GAG, CAT, GGT, TAT, GAA, ACC, GTG, GTT, ATG, GGC, GCA, AGC, TTC, CGT, AAC, ATC, GGC, GAA, ATT, CTG, GAA, CTG, GCA, GGC, TGC, GAC, CGT, CTG, ACC, ATC, GCA, CCG, GCA, CTG, CTG, AAA, GAG, CTG, GCG, GAG, AGC, GAA, GGG, GCT, ATC, GAA, CGT, AAA, CTG, TCT, TAC, ACT, GGT, GAA, GTG, AAA, GCG, CGT, CCG, GCG, CGT, ATC, ACT, GAG, TCC, GAG, TTC, CTG, TGG, CAG, CAC, AAC, CAG, GAT, CCA, ATG, GCA, GTA, GAT, AAA, CTG, GCG, GAA, GGT, ATC, CGT, AAG, TTT, GCT, GTT, GAC, CAG, GAA, AAA, CTG, GAA, AAA, ATG, ATC, GGC, GAT, CTG, CTG, TAA]
Is Protein?: YES
Region Name: molybdopterin biosynthesis mog protein
Nucleotides: ATGAATACTTTACGTATTGGCTTAGTTTCCATCTCTGATCGCGCATCCAGCGGCGTTTATCAGGATAAAGGCATCCCTGCGCTGGAAGAATGGCTGACATCGGCGCTAACCACGCCGTTTGAACTGGAAACCCGCTTAATCCCCGATGAGCAGGCGATCATCGAGCAAACGTTGTGTGAGCTGGTGGATGAAATGAGTTGCCATCTGGTGCTCACCACGGGCGGAACTGGCCCTGCGCGTCGTGACGTAACGCCCGATGCGACGCTGGCAGTAGCGGACCGCGAGATGCCAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACCAACTGCGATCCTTTCGCGTCAGGTGGGGGTGATTCGCAAACAGGCGCTGATCCTTAACTTACCCGGTCAACCGAAGTCTATTAAAGAGACGCTGGAAGGTGTGAAGGACGCTGAGGGTAACGTTGTGGTGCACGGTATTTTTGCCAGCGTACCGTACTGCATTCAGTTGCTGGAAGGGCCATACGTTGAAACGGCACCGGAAGTGGTTGCAGCATTCAGACCGAAGAGTGCAAGACGCGAAGTTAGCGAATAA
Nuc. Counts: [139, 143, 175, 131]
Total Mass%: [24.2, 20.5, 34.1, 21.1] of 77506.9
Codons List: [ATG, AAT, ACT, TTA, CGT, ATT, GGC, TTA, GTT, TCC, ATC, TCT, GAT, CGC, GCA, TCC, AGC, GGC, GTT, TAT, CAG, GAT, AAA, GGC, ATC, CCT, GCG, CTG, GAA, GAA, TGG, CTG, ACA, TCG, GCG, CTA, ACC, ACG, CCG, TTT, GAA, CTG, GAA, ACC, CGC, TTA, ATC, CCC, GAT, GAG, CAG, GCG, ATC, ATC, GAG, CAA, ACG, TTG, TGT, GAG, CTG, GTG, GAT, GAA, ATG, AGT, TGC, CAT, CTG, GTG, CTC, ACC, ACG, GGC, GGA, ACT, GGC, CCT, GCG, CGT, CGT, GAC, GTA, ACG, CCC, GAT, GCG, ACG, CTG, GCA, GTA, GCG, GAC, CGC, GAG, ATG, CCA, GGC, TTT, GGT, GAA, CAG, ATG, CGC, CAG, ATC, AGC, CTG, CAT, TTT, GTA, CCA, ACT, GCG, ATC, CTT, TCG, CGT, CAG, GTG, GGG, GTG, ATT, CGC, AAA, CAG, GCG, CTG, ATC, CTT, AAC, TTA, CCC, GGT, CAA, CCG, AAG, TCT, ATT, AAA, GAG, ACG, CTG, GAA, GGT, GTG, AAG, GAC, GCT, GAG, GGT, AAC, GTT, GTG, GTG, CAC, GGT, ATT, TTT, GCC, AGC, GTA, CCG, TAC, TGC, ATT, CAG, TTG, CTG, GAA, GGG, CCA, TAC, GTT, GAA, ACG, GCA, CCG, GAA, GTG, GTT, GCA, GCA, TTC, AGA, CCG, AAG, AGT, GCA, AGA, CGC, GAA, GTT, AGC, GAA, TAA]
Is Protein?: YES
Region Name: chaperone protein DnaK
Nucleotides: ATGGGTAAAATAATTGGTATCGACCTGGGTACTACCAACTCTTGTGTAGCGATTATGGATGGCACCACTCCTCGTGTACTGGAGAACGCCGAAGGCGATCGCACCACGCCTTCTATCATTGCCTATACCCAGGATGGTGAAACTCTGGTTGGTCAGCCGGCTAAACGTCAGGCAGTGACGAACCCGCAAAACACCCTGTTTGCGATTAAACGCCTGATTGGCCGCCGCTTCCAGGACGAAGAAGTACAGCGTGATGTTTCCATCATGCCGTTCAAAATTATTGCTGCTGATAACGGCGACGCATGGGTCGAAGTTAAAGGCCAGAAAATGGCACCGCCGCAGATCTCTGCTGAAGTGCTGAAAAAAATGAAGAAAACCGCTGAAGATTACCTGGGTGAACCGGTAACTGAAGCTGTTATTACCGTACCGGCATACTTTAACGATGCTCAGCGTCAGGCAACCAAAGACGCAGGCCGTATCGCTGGTCTGGAAGTAAAACGTATCATCAACGAACCGACCGCAGCTGCGCTGGCTTACGGTCTGGACAAAGGTACTGGCAACCGTACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTCCATTATCGAAATCGACGAAGTTGACGGCGAAAAAACCTTCGAAGTTCTGGCAACCAACGGTGATACCCACCTGGGTGGTGAAGACTTCGACAGTCGTCTGATCAACTATCTGGTTGAAGAATTCAAGAAAGATCAGGGCATTGACCTGCGCAACGATCCGCTGGCAATGCAGCGCCTGAAAGAAGCGGCAGAAAAAGCGAAAATCGAACTGTCTTCCGCTCAGCAGACCGACGTTAACCTGCCGTACATCACTGCAGACGCGACCGGTCCGAAACACATGAACATCAAAGTGACTCGTGCGAAACTGGAAAGCCTGGTTGAAGATCTGGTAAACCGTTCCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATATCGACGACGTTATTCTCGTTGGTGGTCAGACTCGTATGCCAATGGTTCAGAAGAAAGTTGCTGAATTCTTTGGTAAAGAGCCGCGTAAAGATGTTAACCCGGACGAAGCTGTAGCCATCGGTGCTGCTGTTCAGGGTGGTGTTCTGACTGGTGACGTAAAAGACGTACTGCTGCTGGACGTTACCCCGCTGTCTCTGGGTATCGAAACCATGGGCGGTGTGATGACCACGCTGATCGCGAAAAACACCACTATCCCGACCAAGCACAGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATCCATGTGCTGCAGGGTGAACGTAAACGTGCGGCTGATAACAAATCTCTGGGTCAGTTCAACCTGGATGGTATCAACCCGGCACCGCGCGGCATGCCGCAGATCGAAGTTACCTTCGATATCGATGCTGACGGTATCCTGCACGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCACTATCAAGGCTTCTTCTGGTCTGAACGAAGATGAAATCCAGAAAATGGTACGCGACGCAGAAGCTAACGCCGAAGCTGACCGTAAGTTTGAAGAGCTGGTACAGACTCGCAACCAGGGCGACCATCTGCTGCACAGCACCCGTAAGCAGGTTGAAGAAGCAGGCGACAAACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGACTGCACTGGAAACTGCTCTGAAAGGTGAAGACAAAGCCGCTATCGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCAGCAGCAACATGCCCAGCAGCAGACTGCCGGTGCTGATGCTTCTGCAAACAACGCGAAAGATGACGATGTTGTCGACGCTGAATTTGAAGAAGTCAAAGACAAAAAATAA
Nuc. Counts: [541, 475, 504, 397]
Total Mass%: [29.0, 21.0, 30.3, 19.7] of 251714.2
Codons List: [ATG, GGT, AAA, ATA, ATT, GGT, ATC, GAC, CTG, GGT, ACT, ACC, AAC, TCT, TGT, GTA, GCG, ATT, ATG, GAT, GGC, ACC, ACT, CCT, CGT, GTA, CTG, GAG, AAC, GCC, GAA, GGC, GAT, CGC, ACC, ACG, CCT, TCT, ATC, ATT, GCC, TAT, ACC, CAG, GAT, GGT, GAA, ACT, CTG, GTT, GGT, CAG, CCG, GCT, AAA, CGT, CAG, GCA, GTG, ACG, AAC, CCG, CAA, AAC, ACC, CTG, TTT, GCG, ATT, AAA, CGC, CTG, ATT, GGC, CGC, CGC, TTC, CAG, GAC, GAA, GAA, GTA, CAG, CGT, GAT, GTT, TCC, ATC, ATG, CCG, TTC, AAA, ATT, ATT, GCT, GCT, GAT, AAC, GGC, GAC, GCA, TGG, GTC, GAA, GTT, AAA, GGC, CAG, AAA, ATG, GCA, CCG, CCG, CAG, ATC, TCT, GCT, GAA, GTG, CTG, AAA, AAA, ATG, AAG, AAA, ACC, GCT, GAA, GAT, TAC, CTG, GGT, GAA, CCG, GTA, ACT, GAA, GCT, GTT, ATT, ACC, GTA, CCG, GCA, TAC, TTT, AAC, GAT, GCT, CAG, CGT, CAG, GCA, ACC, AAA, GAC, GCA, GGC, CGT, ATC, GCT, GGT, CTG, GAA, GTA, AAA, CGT, ATC, ATC, AAC, GAA, CCG, ACC, GCA, GCT, GCG, CTG, GCT, TAC, GGT, CTG, GAC, AAA, GGT, ACT, GGC, AAC, CGT, ACT, ATC, GCG, GTT, TAT, GAC, CTG, GGT, GGT, GGT, ACT, TTC, GAT, ATT, TCC, ATT, ATC, GAA, ATC, GAC, GAA, GTT, GAC, GGC, GAA, AAA, ACC, TTC, GAA, GTT, CTG, GCA, ACC, AAC, GGT, GAT, ACC, CAC, CTG, GGT, GGT, GAA, GAC, TTC, GAC, AGT, CGT, CTG, ATC, AAC, TAT, CTG, GTT, GAA, GAA, TTC, AAG, AAA, GAT, CAG, GGC, ATT, GAC, CTG, CGC, AAC, GAT, CCG, CTG, GCA, ATG, CAG, CGC, CTG, AAA, GAA, GCG, GCA, GAA, AAA, GCG, AAA, ATC, GAA, CTG, TCT, TCC, GCT, CAG, CAG, ACC, GAC, GTT, AAC, CTG, CCG, TAC, ATC, ACT, GCA, GAC, GCG, ACC, GGT, CCG, AAA, CAC, ATG, AAC, ATC, AAA, GTG, ACT, CGT, GCG, AAA, CTG, GAA, AGC, CTG, GTT, GAA, GAT, CTG, GTA, AAC, CGT, TCC, ATT, GAG, CCG, CTG, AAA, GTT, GCA, CTG, CAG, GAC, GCT, GGC, CTG, TCC, GTA, TCT, GAT, ATC, GAC, GAC, GTT, ATT, CTC, GTT, GGT, GGT, CAG, ACT, CGT, ATG, CCA, ATG, GTT, CAG, AAG, AAA, GTT, GCT, GAA, TTC, TTT, GGT, AAA, GAG, CCG, CGT, AAA, GAT, GTT, AAC, CCG, GAC, GAA, GCT, GTA, GCC, ATC, GGT, GCT, GCT, GTT, CAG, GGT, GGT, GTT, CTG, ACT, GGT, GAC, GTA, AAA, GAC, GTA, CTG, CTG, CTG, GAC, GTT, ACC, CCG, CTG, 
TCT, CTG, GGT, ATC, GAA, ACC, ATG, GGC, GGT, GTG, ATG, ACC, ACG, CTG, ATC, GCG, AAA, AAC, ACC, ACT, ATC, CCG, ACC, AAG, CAC, AGC, CAG, GTG, TTC, TCT, ACC, GCT, GAA, GAC, AAC, CAG, TCT, GCG, GTA, ACC, ATC, CAT, GTG, CTG, CAG, GGT, GAA, CGT, AAA, CGT, GCG, GCT, GAT, AAC, AAA, TCT, CTG, GGT, CAG, TTC, AAC, CTG, GAT, GGT, ATC, AAC, CCG, GCA, CCG, CGC, GGC, ATG, CCG, CAG, ATC, GAA, GTT, ACC, TTC, GAT, ATC, GAT, GCT, GAC, GGT, ATC, CTG, CAC, GTT, TCC, GCG, AAA, GAC, AAA, AAC, AGC, GGT, AAA, GAG, CAG, AAG, ATC, ACT, ATC, AAG, GCT, TCT, TCT, GGT, CTG, AAC, GAA, GAT, GAA, ATC, CAG, AAA, ATG, GTA, CGC, GAC, GCA, GAA, GCT, AAC, GCC, GAA, GCT, GAC, CGT, AAG, TTT, GAA, GAG, CTG, GTA, CAG, ACT, CGC, AAC, CAG, GGC, GAC, CAT, CTG, CTG, CAC, AGC, ACC, CGT, AAG, CAG, GTT, GAA, GAA, GCA, GGC, GAC, AAA, CTG, CCG, GCT, GAC, GAC, AAA, ACT, GCT, ATC, GAG, TCT, GCG, CTG, ACT, GCA, CTG, GAA, ACT, GCT, CTG, AAA, GGT, GAA, GAC, AAA, GCC, GCT, ATC, GAA, GCG, AAA, ATG, CAG, GAA, CTG, GCA, CAG, GTT, TCC, CAG, AAA, CTG, ATG, GAA, ATC, GCC, CAG, CAG, CAA, CAT, GCC, CAG, CAG, CAG, ACT, GCC, GGT, GCT, GAT, GCT, TCT, GCA, AAC, AAC, GCG, AAA, GAT, GAC, GAT, GTT, GTC, GAC, GCT, GAA, TTT, GAA, GAA, GTC, AAA, GAC, AAA, AAA, TAA]
Is Protein?: YES
Region Name: chaperone protein DnaJ
Nucleotides: GTGCATTCATCTAGGGGCAATTTAAAAAAGATGGCTAAGCAAGATTATTACGAGATTTTAGGCGTTTCCAAAACAGCGGAAGAGCGTGAAATCAAAAAGGCCTACAAACGCCTGGCCATGAAATACCACCCGGACCGTAACCAGGGTGACAAAGAGGCCGAGGCGAAATTTAAAGAGATCAAGGAAGCTTATGAAGTTCTGACCGACTCGCAAAAACGTGCGGCATACGATCAGTATGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGCGGTTTTGGCGGCGGCGCAGACTTCAGCGATATTTTTGGTGACGTTTTCGGCGATATTTTTGGCGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTACGCTATAACATGGAGCTCACCCTCGAAGAAGCTGTACGTGGCGTGACCAAAGAGATCCGCATTCCGACTCTGGAAGAGTGTGACGTTTGCCACGGTAGCGGTGCAAAACCAGGTACACAGCCGCAGACCTGTCCGACCTGTCATGGTTCTGGCCAGGTGCAGATGCGCCAGGGTTTCTTTGCCGTGCAGCAGACCTGTCCACACTGTCAGGGCCGCGGTACGCTGATCAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGTTGAGCGCAGCAAAACGCTGTCCGTTAAAATCCCGGCAGGGGTGGACACTGGAGACCGCATCCGTCTTGCGGGCGAAGGTGAAGCGGGTGAACACGGCGCACCGGCAGGCGATCTGTACGTTCAGGTTCAGGTTAAACAGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGCGAAGTCCCGATCAACTTCGCTATGGCGGCGCTGGGTGGTGAAATCGAAGTACCGACCCTTGATGGTCGCGTCAAACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAGCTGTTCCGTATGCGCGGTAAAGGCGTCAAGTCTGTCCGCGGTGGCGCACAGGGTGATTTGCTATGCCGCGTTGTTGTCGAAACACCGGTAGGTTTGAACGAGAAGCAGAAACAGCTGCTGCAAGAGCTGCAAGAAAGCTTTGGTGGCCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCTTCTTTGATGGCGTGAAGAAGTTTTTTGACGACCTGACTCGCTAA
Nuc. Counts: [287, 278, 352, 244]
Total Mass%: [25.3, 20.1, 34.7, 19.9] of 153391.5
Codons List: [GTG, CAT, TCA, TCT, AGG, GGC, AAT, TTA, AAA, AAG, ATG, GCT, AAG, CAA, GAT, TAT, TAC, GAG, ATT, TTA, GGC, GTT, TCC, AAA, ACA, GCG, GAA, GAG, CGT, GAA, ATC, AAA, AAG, GCC, TAC, AAA, CGC, CTG, GCC, ATG, AAA, TAC, CAC, CCG, GAC, CGT, AAC, CAG, GGT, GAC, AAA, GAG, GCC, GAG, GCG, AAA, TTT, AAA, GAG, ATC, AAG, GAA, GCT, TAT, GAA, GTT, CTG, ACC, GAC, TCG, CAA, AAA, CGT, GCG, GCA, TAC, GAT, CAG, TAT, GGT, CAT, GCT, GCG, TTT, GAG, CAA, GGT, GGC, ATG, GGC, GGC, GGC, GGT, TTT, GGC, GGC, GGC, GCA, GAC, TTC, AGC, GAT, ATT, TTT, GGT, GAC, GTT, TTC, GGC, GAT, ATT, TTT, GGC, GGC, GGA, CGT, GGT, CGT, CAA, CGT, GCG, GCG, CGC, GGT, GCT, GAT, TTA, CGC, TAT, AAC, ATG, GAG, CTC, ACC, CTC, GAA, GAA, GCT, GTA, CGT, GGC, GTG, ACC, AAA, GAG, ATC, CGC, ATT, CCG, ACT, CTG, GAA, GAG, TGT, GAC, GTT, TGC, CAC, GGT, AGC, GGT, GCA, AAA, CCA, GGT, ACA, CAG, CCG, CAG, ACC, TGT, CCG, ACC, TGT, CAT, GGT, TCT, GGC, CAG, GTG, CAG, ATG, CGC, CAG, GGT, TTC, TTT, GCC, GTG, CAG, CAG, ACC, TGT, CCA, CAC, TGT, CAG, GGC, CGC, GGT, ACG, CTG, ATC, AAA, GAT, CCG, TGC, AAC, AAA, TGT, CAT, GGT, CAT, GGT, CGT, GTT, GAG, CGC, AGC, AAA, ACG, CTG, TCC, GTT, AAA, ATC, CCG, GCA, GGG, GTG, GAC, ACT, GGA, GAC, CGC, ATC, CGT, CTT, GCG, GGC, GAA, GGT, GAA, GCG, GGT, GAA, CAC, GGC, GCA, CCG, GCA, GGC, GAT, CTG, TAC, GTT, CAG, GTT, CAG, GTT, AAA, CAG, CAC, CCG, ATT, TTC, GAG, CGT, GAA, GGC, AAC, AAC, CTG, TAT, TGC, GAA, GTC, CCG, ATC, AAC, TTC, GCT, ATG, GCG, GCG, CTG, GGT, GGT, GAA, ATC, GAA, GTA, CCG, ACC, CTT, GAT, GGT, CGC, GTC, AAA, CTG, AAA, GTG, CCT, GGC, GAA, ACC, CAG, ACC, GGT, AAG, CTG, TTC, CGT, ATG, CGC, GGT, AAA, GGC, GTC, AAG, TCT, GTC, CGC, GGT, GGC, GCA, CAG, GGT, GAT, TTG, CTA, TGC, CGC, GTT, GTT, GTC, GAA, ACA, CCG, GTA, GGT, TTG, AAC, GAG, AAG, CAG, AAA, CAG, CTG, CTG, CAA, GAG, CTG, CAA, GAA, AGC, TTT, GGT, GGC, CCA, ACC, GGC, GAG, CAC, AAC, AGC, CCG, CGT, TCA, AAG, AGC, TTC, TTT, GAT, GGC, GTG, AAG, AAG, TTT, TTT, GAC, GAC, CTG, ACT, CGC, TAA]
Is Protein?: NO
Region Name: hypothetical protein
Nucleotides: TTGCTCTTACTCGGATTCGTAAGCCGTGAAAACAGCAACCTCCGTCTGGCCAGTTCGGATGTGAACCTCACAGAGGTCTTTTCTCGTTACCAGCGCCGCCACTACGGCGGTGATACAGATGACGATCAGGGCGACAATCATCGCCTTATGCTGCTTCATTGCTCTCTTCTCCTTGACCTTTCGGTCAGTAAGAGGCACTCTACATGTGTTCTGCATATAGGGGGCCTCGGGTTGATGGTAAAATATCACTCGGGGCTTTTCTCTATCTGCCGTTCAGCTAATGCCTGA
Nuc. Counts: [58, 78, 69, 83]
Total Mass%: [21.0, 23.2, 27.9, 27.8] of 37315.2
Codons List: [TTG, CTC, TTA, CTC, GGA, TTC, GTA, AGC, CGT, GAA, AAC, AGC, AAC, CTC, CGT, CTG, GCC, AGT, TCG, GAT, GTG, AAC, CTC, ACA, GAG, GTC, TTT, TCT, CGT, TAC, CAG, CGC, CGC, CAC, TAC, GGC, GGT, GAT, ACA, GAT, GAC, GAT, CAG, GGC, GAC, AAT, CAT, CGC, CTT, ATG, CTG, CTT, CAT, TGC, TCT, CTT, CTC, CTT, GAC, CTT, TCG, GTC, AGT, AAG, AGG, CAC, TCT, ACA, TGT, GTT, CTG, CAT, ATA, GGG, GGC, CTC, GGG, TTG, ATG, GTA, AAA, TAT, CAC, TCG, GGG, CTT, TTC, TCT, ATC, TGC, CGT, TCA, GCT, AAT, GCC, TGA]
Is Protein?: NO
Region Name: hypothetical protein
Nucleotides: ATGTCTGCCAAAAGACGACTTCTTATTGCGTGTACCTTGATAACAGCTATCTATCATTTTCCTGCATATTCTTCATTAGAATATAAAGGATCCTTTGGTTCAATAAATGCGGGTTATGCAGACTGGAATAGTGGATTTGTAAACACTCACCGTGGTGAAGTATGGAAAGTGACTGCGGATTTTGGGGTAAATTTTAAAGAAGCAGAATTTTACTCATTTTATGAAAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACGGTTTCAGCAATGACGCATGTCAGACTCTTTGACTCTGATATGACATTCTTTGGCAAAATTTATGGCCAATGGGATAACTCATGGGGTGACGATCTGGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCGAGTGGGGCTTTTTTAAACCGTATATTGGATTGCATAATCAATCTGGTGACTACGTATCAGCTAAATATGGTCAAACGAATGGTTGGAATGGTTATGTTGTTGGCTGGACAGCAGTATTACCATTTACGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGAAATAGAACTGGACAGGAACGATGCTTACACGGAGCAGCAATTTGGCCGGAACGGGTTAAATGGCGGTTTAACTATTGCCTGGAAGTTCTATCCTCGCTGGAAAGCCAGTGTGACGTGGCGTTATTTCGATAATAAGCTGGGCTACGATGGCTTTGGCGATCAAATGATTTATATGCTTGGTTATGATTTCTAA
Nuc. Counts: [214, 121, 184, 243]
Total Mass%: [28.8, 13.4, 27.7, 30.2] of 100569.4
Codons List: [ATG, TCT, GCC, AAA, AGA, CGA, CTT, CTT, ATT, GCG, TGT, ACC, TTG, ATA, ACA, GCT, ATC, TAT, CAT, TTT, CCT, GCA, TAT, TCT, TCA, TTA, GAA, TAT, AAA, GGA, TCC, TTT, GGT, TCA, ATA, AAT, GCG, GGT, TAT, GCA, GAC, TGG, AAT, AGT, GGA, TTT, GTA, AAC, ACT, CAC, CGT, GGT, GAA, GTA, TGG, AAA, GTG, ACT, GCG, GAT, TTT, GGG, GTA, AAT, TTT, AAA, GAA, GCA, GAA, TTT, TAC, TCA, TTT, TAT, GAA, AGT, AAT, GTA, CTC, AAT, CAT, GCT, GTA, GCA, GGG, AGA, AAT, CAT, ACG, GTT, TCA, GCA, ATG, ACG, CAT, GTC, AGA, CTC, TTT, GAC, TCT, GAT, ATG, ACA, TTC, TTT, GGC, AAA, ATT, TAT, GGC, CAA, TGG, GAT, AAC, TCA, TGG, GGT, GAC, GAT, CTG, GAC, ATG, TTT, TAT, GGA, TTC, GGT, TAC, CTC, GGC, TGG, AAC, GGC, GAG, TGG, GGC, TTT, TTT, AAA, CCG, TAT, ATT, GGA, TTG, CAT, AAT, CAA, TCT, GGT, GAC, TAC, GTA, TCA, GCT, AAA, TAT, GGT, CAA, ACG, AAT, GGT, TGG, AAT, GGT, TAT, GTT, GTT, GGC, TGG, ACA, GCA, GTA, TTA, CCA, TTT, ACG, TTA, TTT, GAC, GAA, AAA, TTT, GTT, TTA, TCT, AAC, TGG, AAT, GAA, ATA, GAA, CTG, GAC, AGG, AAC, GAT, GCT, TAC, ACG, GAG, CAG, CAA, TTT, GGC, CGG, AAC, GGG, TTA, AAT, GGC, GGT, TTA, ACT, ATT, GCC, TGG, AAG, TTC, TAT, CCT, CGC, TGG, AAA, GCC, AGT, GTG, ACG, TGG, CGT, TAT, TTC, GAT, AAT, AAG, CTG, GGC, TAC, GAT, GGC, TTT, GGC, GAT, CAA, ATG, ATT, TAT, ATG, CTT, GGT, TAT, GAT, TTC, TAA]
Is Protein?: YES
Region Name: putative secreted sulfatase
Nucleotides: ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAATGCTTTTAGTCCTGCCTTAGCCGCAGAGGCTAAACAACCTAATTTAGTCATTATTATGGCGGATGATTTAGGTTATGGCGATTTAGCAACATATGGTCATCAGATCGTTAAAACACCTAATATCGACAGGCTTGCCCAGGAAGGGGTCAAATTTACTGACTACTATGCCCCCGCTCCTTTAAGTTCACCTTCACGCGCAGGGCTATTAACCGGCCGGATGCCATTTCGTACTGGAATTCGCTCATGGATTCCTTCAGGCAAAGATGTTGCCTTAGGGCGTAACGAACTCACGATTGCTAATCTACTCAAAGCGCAAGGGTACGACACGGCAATGATGGGTAAGCTGCATCTGAATGCAGGCGGCGATCGCACCGATCAGCCACAAGCACAAGATATGGGCTTTGATTACTCACTGGTTAATACGGCGGGCTTTGTTACCGACGCCACGCTGGATAACGCTAAAGAACGCCCGCGTTATGGCATGGTTTACCCGACAGGCTGGCTACGTAACGGGCAACCCACTCCACGAGCTGATAAAATGAGCGGTGAGTATGTCAGTTCGGAAGTCGTCAACTGGCTGGATAACAAAAAGGACAGCAAGCCTTTCTTCCTCTATGTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAAAATACCTCGATATGTACTCACAATATATGAGCGCGTATCAGAAGCAGCATCCTGATTTATTTTATGGCGACTGGGCAGACAAACCCTGGCGTGGTGTGGGGGAATATTATGCCAATATCAGCTATCTGGATGCACAGGTTGGAAAAGTGCTGGATAAAATCAAAGCTGTGGGTGAAGAAGATAACACAATCGTTATTTTTACCAGTGATAACGGTCCGGTAACGCGTGAAGCGCGCAAAGTGTATGAGCTGAATTTGGCAGGGGAAACGGATGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGTGTTCCAGCCATTATTAAATATGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGTCTGGACTGGATGCCTACTTTAGCGAAAATGATGAACTTCAAATTACCTACAGACCGTACTTTCGATGGTGAATCGCTGGTTCCTGTTCTTGAGCAAAAAGCATTGAAACGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATGATCCAACCGATGAATGGGCGATCCGTGATGGTGACTGGAAGATGATTATCGATCGCAATAATAAACCGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAACACTTAATCTGATCGGTAAAAAAACAGATATTGAAAAACAGATGTATGGTAAGTTTTTAAAATATAAAACTGATATTGATAATGATTCTCTAATGAAAGCCAGAGGTGATAAACCAGAAGCGGTGACCTGGGGCTAA
Nuc. Counts: [440, 312, 362, 380]
Total Mass%: [30.3, 17.7, 27.9, 24.2] of 196369.5
Codons List: [ATG, CAG, AAA, ACG, TTA, ATG, GCC, AGT, TTG, ATC, GGC, CTT, GCA, GTT, TGC, ACA, GGG, AAT, GCT, TTT, AGT, CCT, GCC, TTA, GCC, GCA, GAG, GCT, AAA, CAA, CCT, AAT, TTA, GTC, ATT, ATT, ATG, GCG, GAT, GAT, TTA, GGT, TAT, GGC, GAT, TTA, GCA, ACA, TAT, GGT, CAT, CAG, ATC, GTT, AAA, ACA, CCT, AAT, ATC, GAC, AGG, CTT, GCC, CAG, GAA, GGG, GTC, AAA, TTT, ACT, GAC, TAC, TAT, GCC, CCC, GCT, CCT, TTA, AGT, TCA, CCT, TCA, CGC, GCA, GGG, CTA, TTA, ACC, GGC, CGG, ATG, CCA, TTT, CGT, ACT, GGA, ATT, CGC, TCA, TGG, ATT, CCT, TCA, GGC, AAA, GAT, GTT, GCC, TTA, GGG, CGT, AAC, GAA, CTC, ACG, ATT, GCT, AAT, CTA, CTC, AAA, GCG, CAA, GGG, TAC, GAC, ACG, GCA, ATG, ATG, GGT, AAG, CTG, CAT, CTG, AAT, GCA, GGC, GGC, GAT, CGC, ACC, GAT, CAG, CCA, CAA, GCA, CAA, GAT, ATG, GGC, TTT, GAT, TAC, TCA, CTG, GTT, AAT, ACG, GCG, GGC, TTT, GTT, ACC, GAC, GCC, ACG, CTG, GAT, AAC, GCT, AAA, GAA, CGC, CCG, CGT, TAT, GGC, ATG, GTT, TAC, CCG, ACA, GGC, TGG, CTA, CGT, AAC, GGG, CAA, CCC, ACT, CCA, CGA, GCT, GAT, AAA, ATG, AGC, GGT, GAG, TAT, GTC, AGT, TCG, GAA, GTC, GTC, AAC, TGG, CTG, GAT, AAC, AAA, AAG, GAC, AGC, AAG, CCT, TTC, TTC, CTC, TAT, GTT, GCT, TTT, ACC, GAA, GTG, CAT, AGC, CCC, CTG, GCT, TCG, CCC, AAA, AAA, TAC, CTC, GAT, ATG, TAC, TCA, CAA, TAT, ATG, AGC, GCG, TAT, CAG, AAG, CAG, CAT, CCT, GAT, TTA, TTT, TAT, GGC, GAC, TGG, GCA, GAC, AAA, CCC, TGG, CGT, GGT, GTG, GGG, GAA, TAT, TAT, GCC, AAT, ATC, AGC, TAT, CTG, GAT, GCA, CAG, GTT, GGA, AAA, GTG, CTG, GAT, AAA, ATC, AAA, GCT, GTG, GGT, GAA, GAA, GAT, AAC, ACA, ATC, GTT, ATT, TTT, ACC, AGT, GAT, AAC, GGT, CCG, GTA, ACG, CGT, GAA, GCG, CGC, AAA, GTG, TAT, GAG, CTG, AAT, TTG, GCA, GGG, GAA, ACG, GAT, GGA, TTA, CGC, GGT, CGC, AAG, GAT, AAC, CTT, TGG, GAA, GGC, GGA, ATT, CGT, GTT, CCA, GCC, ATT, ATT, AAA, TAT, GGT, AAA, CAT, CTA, CCA, CAG, GGA, ATG, GTT, TCA, GAT, ACA, CCC, GTT, TAT, GGT, CTG, GAC, TGG, ATG, CCT, ACT, TTA, GCG, AAA, ATG, ATG, AAC, TTC, AAA, TTA, CCT, ACA, GAC, CGT, ACT, TTC, GAT, GGT, GAA, TCG, CTG, GTT, CCT, GTT, CTT, GAG, 
CAA, AAA, GCA, TTG, AAA, CGC, GAA, AAG, CCA, TTA, ATT, TTC, GGG, ATT, GAT, ATG, CCA, TTC, CAG, GAT, GAT, CCA, ACC, GAT, GAA, TGG, GCG, ATC, CGT, GAT, GGT, GAC, TGG, AAG, ATG, ATT, ATC, GAT, CGC, AAT, AAT, AAA, CCG, AAA, TAT, CTC, TAC, AAT, CTG, AAA, TCT, GAT, CGT, TAT, GAA, ACA, CTT, AAT, CTG, ATC, GGT, AAA, AAA, ACA, GAT, ATT, GAA, AAA, CAG, ATG, TAT, GGT, AAG, TTT, TTA, AAA, TAT, AAA, ACT, GAT, ATT, GAT, AAT, GAT, TCT, CTA, ATG, AAA, GCC, AGA, GGT, GAT, AAA, CCA, GAA, GCG, GTG, ACC, TGG, GGC, TAA]
Is Protein?: YES
Region Name: putative cytoplasmic protein
Nucleotides: ATGTTTACCAACGTAAATGTTGATTGTTGCAAAACACCAGGATGTAAAAACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCACAGGGTAAAAATATTTTATGCCGTGAATGTGGTTACTTGTTTCCAGTGATATCTGAACAGTCGCTTAATATTTATCGTAATATTGTGAATCACTCCTGGAGAGGTTTGATTTGCCAATGTTCAACTTGCGGAGGCACGTCCCTCAAAAAATATGGATATTCTGCACAAGGCCAGAGAAGAATGTATTGCCATCATTGTGAGAAAACATTTATCACTCTGGAACATGTAATTACCACACCACGAGGAGCCCTGTTAGCATTGATGATTGAGCAAGGGGAGGCACTTGCGGATATCAGAAAGTCATTACGTCTTAACAGCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGCAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGTACCCGCGCTTTTCGCGTCAAGTATAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGCGGCAGGGTGGTTGCCATCTCAACCAATTACTCCCCATCTGCCGTAGAGCAACATTATCAATACACATCGAACTATGAAGAGCGTATGTCTCCAGGGACGCTGGCACATCATGTCCAGCGCAAAGAGTTACTTACTATGCGGCGGGATACCTTGTTTGATATTGATTACGGCCCGGCAGTTTTACATCAAAACGATCCGGGAATGTTGGTAAAACCGGTTCTTCCGGCATATCGTCATTTTGAACTGGTCAGAATACTGACCGATGAGCATTCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATATTGGGCGGCTGCCTGATGGCTAATTTGCAGCATATTCATCAAGGTCGCTGCCATATTTCCTTTGTCAAAGAGCGCGGTGTGGCACCCGCCACCATTGATTTTCCACCGCGATTATTCCTTAGTGGTGGGGTACGAAATAATGTCTGGCGTGCATTTTCTAACCGCAATTATTCAATGGCTGTATGCAATCTCACTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATTGAACAGTGCGACGCGTTTTATCCACTTTGTGGAGAACCATCCTTTCCTTATATCATTGAACCGAATGTCTCCTGCGAATGTCGTTTCTACATTAGATATCCTCAAACATCTGTGGAATAAAAAACTAGAGCATGGAACAATTTAA
Nuc. Counts: [355, 273, 276, 356]
Total Mass%: [29.2, 18.4, 25.3, 27.1] of 164551.0
Codons List: [ATG, TTT, ACC, AAC, GTA, AAT, GTT, GAT, TGT, TGC, AAA, ACA, CCA, GGA, TGT, AAA, AAC, CTG, GGG, TTG, CTG, AAT, AGC, CAG, GAT, TAT, GTC, GCA, CAG, GGT, AAA, AAT, ATT, TTA, TGC, CGT, GAA, TGT, GGT, TAC, TTG, TTT, CCA, GTG, ATA, TCT, GAA, CAG, TCG, CTT, AAT, ATT, TAT, CGT, AAT, ATT, GTG, AAT, CAC, TCC, TGG, AGA, GGT, TTG, ATT, TGC, CAA, TGT, TCA, ACT, TGC, GGA, GGC, ACG, TCC, CTC, AAA, AAA, TAT, GGA, TAT, TCT, GCA, CAA, GGC, CAG, AGA, AGA, ATG, TAT, TGC, CAT, CAT, TGT, GAG, AAA, ACA, TTT, ATC, ACT, CTG, GAA, CAT, GTA, ATT, ACC, ACA, CCA, CGA, GGA, GCC, CTG, TTA, GCA, TTG, ATG, ATT, GAG, CAA, GGG, GAG, GCA, CTT, GCG, GAT, ATC, AGA, AAG, TCA, TTA, CGT, CTT, AAC, AGC, ACT, GGA, CTT, AGC, CGT, GAA, CTG, TTA, AAA, TTA, GCG, CGT, GAA, GCA, AAC, TAT, AAA, GAA, AGT, CGA, CAG, TGT, TTC, CCT, GCT, TCT, GAT, ATT, ACC, CTG, AGT, ACC, CGC, GCT, TTT, CGC, GTC, AAG, TAT, AAT, GGT, AGC, AAT, AAC, TCT, CTT, TAT, GCT, CTT, GTT, ACC, GCA, GAA, GAA, CAA, AGC, GGC, AGG, GTG, GTT, GCC, ATC, TCA, ACC, AAT, TAC, TCC, CCA, TCT, GCC, GTA, GAG, CAA, CAT, TAT, CAA, TAC, ACA, TCG, AAC, TAT, GAA, GAG, CGT, ATG, TCT, CCA, GGG, ACG, CTG, GCA, CAT, CAT, GTC, CAG, CGC, AAA, GAG, TTA, CTT, ACT, ATG, CGG, CGG, GAT, ACC, TTG, TTT, GAT, ATT, GAT, TAC, GGC, CCG, GCA, GTT, TTA, CAT, CAA, AAC, GAT, CCG, GGA, ATG, TTG, GTA, AAA, CCG, GTT, CTT, CCG, GCA, TAT, CGT, CAT, TTT, GAA, CTG, GTC, AGA, ATA, CTG, ACC, GAT, GAG, CAT, TCC, AAC, AAC, GTT, CAG, CAT, TAC, CTT, GAT, CAC, GAA, TGC, TTT, ATA, TTG, GGC, GGC, TGC, CTG, ATG, GCT, AAT, TTG, CAG, CAT, ATT, CAT, CAA, GGT, CGC, TGC, CAT, ATT, TCC, TTT, GTC, AAA, GAG, CGC, GGT, GTG, GCA, CCC, GCC, ACC, ATT, GAT, TTT, CCA, CCG, CGA, TTA, TTC, CTT, AGT, GGT, GGG, GTA, CGA, AAT, AAT, GTC, TGG, CGT, GCA, TTT, TCT, AAC, CGC, AAT, TAT, TCA, ATG, GCT, GTA, TGC, AAT, CTC, ACT, GGC, AGT, AAG, AAA, GTC, CGC, GAG, ATG, CGG, CAT, GCA, ACA, TTG, AAC, AGT, GCG, ACG, CGT, TTT, ATC, CAC, TTT, GTG, GAG, AAC, CAT, CCT, TTC, CTT, ATA, TCA, TTG, AAC, CGA, ATG, TCT, CCT, GCG, 
AAT, GTC, GTT, TCT, ACA, TTA, GAT, ATC, CTC, AAA, CAT, CTG, TGG, AAT, AAA, AAA, CTA, GAG, CAT, GGA, ACA, ATT, TAA]
Is Protein?: YES
Region Name: sodium/proton antiporter 1
Nucleotides: GTGAAACATCTGCATCGATTCTTTAGCAGTGATGCCTCGGGAGGCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTGCAACCAGTGGATGGTATCACGACTTTCTTGAGACGCCGGTTCAGCTCCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGACGCTCTGATGGCGGTATTTTTCCTGTTGGTTGGTCTGGAAGTTAAACGCGAGCTGATGCAAGGTTCGCTGGCCAGTCTGCGCCAGGCGGCATTTCCTGTTATTGCCGCAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTTTTAACTATGCCGATCCGATTACCCGCGAAGGCTGGGCAATCCCGGCGGCGACTGACATTGCCTTTGCACTTGGTGTGTTGGCGCTGTTGGGAAGTCGTGTTCCGTTAGCGCTGAAGATCTTTTTGATGGCTCTGGCTATTATCGACGATCTTGGGGCCATCATTATCATCGCATTGTTCTACACTAATGACTTATCGATGGCCTCTCTTGGCGTCGCGGCTGTAGCAATTGCGGTACTCGCGGTATTGAATCTGTGTGGTGTACGCCGCACGGGCGTTTATATTCTGGTTGGCGTGGTGCTGTGGACAGCGGTGTTGAAATCGGGGGTTCACGCAACCCTGGCTGGCGTCATTGTCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGGCGCTCTCCGGCTAAACGTCTGGAGCATGTTTTGCATCCATGGGTGGCGTATCTGATTTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAAGGTGTCACGCTGGAAGGTTTGACCTCCATTCTGCCATTAGGGATCATCGCTGGTTTGCTGATTGGCAAGCCACTGGGTATTAGTCTGTTCTGCTGGTTGGCGCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACGACTTACCAGCAAATTATGGCGGTTGGTATCCTGTGCGGTATCGGTTTTACTATGTCTATCTTTATTGCCAGCCTGGCATTTGGTAGCGTAGATCCAGAACTGATTAACTGGGCAAAATTAGGTATCCTTGTCGGTTCAATTTCTTCGGCGGTAATTGGATATAGCTGGTTACGCGTTCGTTTACGTCCATCAGTTTGA
Nuc. Counts: [215, 258, 331, 363]
Total Mass%: [19.0, 18.7, 32.7, 29.7] of 153154.3
Codons List: [GTG, AAA, CAT, CTG, CAT, CGA, TTC, TTT, AGC, AGT, GAT, GCC, TCG, GGA, GGC, ATT, ATT, CTC, ATT, ATT, GCC, GCT, GTA, TTA, GCG, ATG, ATT, ATG, GCC, AAC, AGC, GGT, GCA, ACC, AGT, GGA, TGG, TAT, CAC, GAC, TTT, CTT, GAG, ACG, CCG, GTT, CAG, CTC, CGG, GTT, GGG, ACA, CTT, GAG, ATC, AAC, AAG, AAC, ATG, CTG, CTA, TGG, ATC, AAT, GAC, GCT, CTG, ATG, GCG, GTA, TTT, TTC, CTG, TTG, GTT, GGT, CTG, GAA, GTT, AAA, CGC, GAG, CTG, ATG, CAA, GGT, TCG, CTG, GCC, AGT, CTG, CGC, CAG, GCG, GCA, TTT, CCT, GTT, ATT, GCC, GCA, ATC, GGC, GGG, ATG, ATT, GTC, CCG, GCA, TTG, CTC, TAT, CTG, GCT, TTT, AAC, TAT, GCC, GAT, CCG, ATT, ACC, CGC, GAA, GGC, TGG, GCA, ATC, CCG, GCG, GCG, ACT, GAC, ATT, GCC, TTT, GCA, CTT, GGT, GTG, TTG, GCG, CTG, TTG, GGA, AGT, CGT, GTT, CCG, TTA, GCG, CTG, AAG, ATC, TTT, TTG, ATG, GCT, CTG, GCT, ATT, ATC, GAC, GAT, CTT, GGG, GCC, ATC, ATT, ATC, ATC, GCA, TTG, TTC, TAC, ACT, AAT, GAC, TTA, TCG, ATG, GCC, TCT, CTT, GGC, GTC, GCG, GCT, GTA, GCA, ATT, GCG, GTA, CTC, GCG, GTA, TTG, AAT, CTG, TGT, GGT, GTA, CGC, CGC, ACG, GGC, GTT, TAT, ATT, CTG, GTT, GGC, GTG, GTG, CTG, TGG, ACA, GCG, GTG, TTG, AAA, TCG, GGG, GTT, CAC, GCA, ACC, CTG, GCT, GGC, GTC, ATT, GTC, GGC, TTC, TTT, ATT, CCT, TTG, AAA, GAG, AAG, CAT, GGG, CGC, TCT, CCG, GCT, AAA, CGT, CTG, GAG, CAT, GTT, TTG, CAT, CCA, TGG, GTG, GCG, TAT, CTG, ATT, TTG, CCG, CTG, TTT, GCA, TTT, GCT, AAT, GCT, GGC, GTT, TCA, CTG, CAA, GGT, GTC, ACG, CTG, GAA, GGT, TTG, ACC, TCC, ATT, CTG, CCA, TTA, GGG, ATC, ATC, GCT, GGT, TTG, CTG, ATT, GGC, AAG, CCA, CTG, GGT, ATT, AGT, CTG, TTC, TGC, TGG, TTG, GCG, CTG, CGT, TTG, AAA, TTG, GCA, CAT, CTG, CCA, GAG, GGA, ACG, ACT, TAC, CAG, CAA, ATT, ATG, GCG, GTT, GGT, ATC, CTG, TGC, GGT, ATC, GGT, TTT, ACT, ATG, TCT, ATC, TTT, ATT, GCC, AGC, CTG, GCA, TTT, GGT, AGC, GTA, GAT, CCA, GAA, CTG, ATT, AAC, TGG, GCA, AAA, TTA, GGT, ATC, CTT, GTC, GGT, TCA, ATT, TCT, TCG, GCG, GTA, ATT, GGA, TAT, AGC, TGG, TTA, CGC, GTT, CGT, TTA, CGT, CCA, TCA, GTT, TGA]
Is Protein?: NO
Region Name: transcriptional activator protein NhaR
Nucleotides: ATGAGCATGTCTCATATCAATTACAACCACTTGTATTACTTCTGGCATGTCTACAAAGAAGGTTCTGTGGTTGGCGCAGCGGAGGCGCTTTATTTAACACCACAAACCATTACCGGGCAGATCCGGGCGCTGGAAGAGCGCCTGCAAGGGAAACTATTTAAGCGTAAAGGACGTGGTCTGGAACCCAGCGAACTGGGGGAACTGGTCTATCGCTATGCCGATAAAATGTTCACCTTAAGCCAGGAAATGCTGGATATCGTCAACTATCGCAAAGAGTCCAACTTATTGTTTGATGTTGGTGTGGCAGATGCACTTTCCAAACGTCTGGTCAGCAGTGTTCTGGATGCCGCAGTTGTGGAAGACGAGCAGATCCATCTACGCTGTTTCGAATCGACGCACGAGATGCTTTTAGAGCAGTTGAGTCAGCATAAACTGGATATGATCATCTCTGACTGTCCGATCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAATTGGCGAATGTGGTGTCAGTTTCTGGTGCACTAACCCACTACCAGAAAAGCCGTTTCCTGCCTGTCTTGAAGAGCGTCGTTTACTTATTCCGGGGCGTCGCTCAATGTTGGGGCGTAAACTATTAAACTGGTTTAACTCCCAGGGCTTGAACGTCGAAATTTTGGGTGAGTTTGATGATGCTGCGTTGATGAAAGCCTTTGGGGCGACGCATAACGCTATTTTCGTTGCACCTTCGCTTTACGCTAATGATTTCTATAACGATGACTCGGTTGTGGAGATAGGCCGTGTTGAGAACGTGATGGAAGAGTACCACGCGATTTTTGCCGAAAGGATGATTCAGCACCCTGCAGTACAGCGTATCTGCAATACAGACTATTCTGCGCTGTTTACTCCAGCTTCAAAATAA
Nuc. Counts: [228, 197, 232, 249]
Total Mass%: [25.9, 18.4, 29.5, 26.2] of 118909.8
Codons List: [ATG, AGC, ATG, TCT, CAT, ATC, AAT, TAC, AAC, CAC, TTG, TAT, TAC, TTC, TGG, CAT, GTC, TAC, AAA, GAA, GGT, TCT, GTG, GTT, GGC, GCA, GCG, GAG, GCG, CTT, TAT, TTA, ACA, CCA, CAA, ACC, ATT, ACC, GGG, CAG, ATC, CGG, GCG, CTG, GAA, GAG, CGC, CTG, CAA, GGG, AAA, CTA, TTT, AAG, CGT, AAA, GGA, CGT, GGT, CTG, GAA, CCC, AGC, GAA, CTG, GGG, GAA, CTG, GTC, TAT, CGC, TAT, GCC, GAT, AAA, ATG, TTC, ACC, TTA, AGC, CAG, GAA, ATG, CTG, GAT, ATC, GTC, AAC, TAT, CGC, AAA, GAG, TCC, AAC, TTA, TTG, TTT, GAT, GTT, GGT, GTG, GCA, GAT, GCA, CTT, TCC, AAA, CGT, CTG, GTC, AGC, AGT, GTT, CTG, GAT, GCC, GCA, GTT, GTG, GAA, GAC, GAG, CAG, ATC, CAT, CTA, CGC, TGT, TTC, GAA, TCG, ACG, CAC, GAG, ATG, CTT, TTA, GAG, CAG, TTG, AGT, CAG, CAT, AAA, CTG, GAT, ATG, ATC, ATC, TCT, GAC, TGT, CCG, ATC, GAT, TCC, ACT, CAG, CAG, GAA, GGG, CTG, TTT, TCC, ATG, AAA, ATT, GGC, GAA, TGT, GGT, GTC, AGT, TTC, TGG, TGC, ACT, AAC, CCA, CTA, CCA, GAA, AAG, CCG, TTT, CCT, GCC, TGT, CTT, GAA, GAG, CGT, CGT, TTA, CTT, ATT, CCG, GGG, CGT, CGC, TCA, ATG, TTG, GGG, CGT, AAA, CTA, TTA, AAC, TGG, TTT, AAC, TCC, CAG, GGC, TTG, AAC, GTC, GAA, ATT, TTG, GGT, GAG, TTT, GAT, GAT, GCT, GCG, TTG, ATG, AAA, GCC, TTT, GGG, GCG, ACG, CAT, AAC, GCT, ATT, TTC, GTT, GCA, CCT, TCG, CTT, TAC, GCT, AAT, GAT, TTC, TAT, AAC, GAT, GAC, TCG, GTT, GTG, GAG, ATA, GGC, CGT, GTT, GAG, AAC, GTG, ATG, GAA, GAG, TAC, CAC, GCG, ATT, TTT, GCC, GAA, AGG, ATG, ATT, CAG, CAC, CCT, GCA, GTA, CAG, CGT, ATC, TGC, AAT, ACA, GAC, TAT, TCT, GCG, CTG, TTT, ACT, CCA, GCT, TCA, AAA, TAA]
Is Protein?: YES
Region Name: riboflavin kinase
Nucleotides: ATGAAGCTGATACGCGGCATACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTAATTTCGACGGCGTGCATCGCGGTCATCGCGCGCTGTTACAGGGCTTGCAGGAAGAAGGGCGCAAGCGCAACTTACCGGTGATGGTGATGCTTTTTGAACCTCAACCACTGGAACTGTTTGCTACTGATAAAGCCCCGGCACGGCTCACCCGGCTGCGGGAAAAACTGCGTTATCTTGCAGAGTGTGGCGTTGATTACGTGCTGTGCGTGCGTTTTGACAGGCGTTTTGCGGCGTTAACCGCGCAAAACTTCATCAGTGATCTTCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGATTTCCGCTTTGGCGCTGGTCGTGAAGGCGATTTCTTGTTATTACAGAAAGCGGGCATGGAATACGGCTTCGATATCACCAGCACGCAAACTTTTTGCGAAGGTGGTGTGCGTATCAGCAGCACCGCCGTGCGTCAGGCGCTTGCGGATGACAATCTGGCTCTGGCAGAAAGTTTACTGGGGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGAATTAGGGCGCACTATAGGTTTCCCGACGGCGAATGTACCGCTACGCCGTCAGGTTTCCCCGGTGAAAGGGGTTTATGCGGTAGAAGTGTTGGGCCTTGGCGAAAAGCCGTTACCCGGCGTTGCAAACATCGGAACACGCCCAACGGTTGCCGGTATTCGCCAGCAACTGGAAGTGCATTTGTTAGATGTTGCAATGGACCTTTATGGTCGCCATATACAAGTAGTGCTGCGTAAAAAAATACGCAATGAGCAGCGATTTGCATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGCCCGCGAATTTTTTGGGCTAACAAAACCGGCTTAA
Nuc. Counts: [213, 221, 276, 232]
Total Mass%: [23.2, 19.8, 33.6, 23.4] of 124072.2
Codons List: [ATG, AAG, CTG, ATA, CGC, GGC, ATA, CAT, AAT, CTC, AGC, CAG, GCC, CCG, CAA, GAA, GGG, TGT, GTG, CTG, ACT, ATT, GGT, AAT, TTC, GAC, GGC, GTG, CAT, CGC, GGT, CAT, CGC, GCG, CTG, TTA, CAG, GGC, TTG, CAG, GAA, GAA, GGG, CGC, AAG, CGC, AAC, TTA, CCG, GTG, ATG, GTG, ATG, CTT, TTT, GAA, CCT, CAA, CCA, CTG, GAA, CTG, TTT, GCT, ACT, GAT, AAA, GCC, CCG, GCA, CGG, CTC, ACC, CGG, CTG, CGG, GAA, AAA, CTG, CGT, TAT, CTT, GCA, GAG, TGT, GGC, GTT, GAT, TAC, GTG, CTG, TGC, GTG, CGT, TTT, GAC, AGG, CGT, TTT, GCG, GCG, TTA, ACC, GCG, CAA, AAC, TTC, ATC, AGT, GAT, CTT, CTG, GTG, AAG, CAC, TTG, CGG, GTA, AAA, TTT, CTT, GCC, GTA, GGT, GAC, GAT, TTC, CGC, TTT, GGC, GCT, GGT, CGT, GAA, GGC, GAT, TTC, TTG, TTA, TTA, CAG, AAA, GCG, GGC, ATG, GAA, TAC, GGC, TTC, GAT, ATC, ACC, AGC, ACG, CAA, ACT, TTT, TGC, GAA, GGT, GGT, GTG, CGT, ATC, AGC, AGC, ACC, GCC, GTG, CGT, CAG, GCG, CTT, GCG, GAT, GAC, AAT, CTG, GCT, CTG, GCA, GAA, AGT, TTA, CTG, GGG, CAC, CCG, TTT, GCT, ATC, TCC, GGG, CGT, GTA, GTC, CAC, GGT, GAT, GAA, TTA, GGG, CGC, ACT, ATA, GGT, TTC, CCG, ACG, GCG, AAT, GTA, CCG, CTA, CGC, CGT, CAG, GTT, TCC, CCG, GTG, AAA, GGG, GTT, TAT, GCG, GTA, GAA, GTG, TTG, GGC, CTT, GGC, GAA, AAG, CCG, TTA, CCC, GGC, GTT, GCA, AAC, ATC, GGA, ACA, CGC, CCA, ACG, GTT, GCC, GGT, ATT, CGC, CAG, CAA, CTG, GAA, GTG, CAT, TTG, TTA, GAT, GTT, GCA, ATG, GAC, CTT, TAT, GGT, CGC, CAT, ATA, CAA, GTA, GTG, CTG, CGT, AAA, AAA, ATA, CGC, AAT, GAG, CAG, CGA, TTT, GCA, TCG, CTG, GAC, GAA, CTG, AAA, GCG, CAG, ATT, GCG, CGT, GAT, GAA, TTA, ACC, GCC, CGC, GAA, TTT, TTT, GGG, CTA, ACA, AAA, CCG, GCT, TAA]
Is Protein?: YES
Region Name: Isoleucyl-tRNA synthetase
Nucleotides: ATGAGTGACTATAAATCAACCCTGAATTTGCCGGAAACAGGGTTCCCGATGCGTGGCGATCTCGCCAAGCGCGAACCGGGAATGCTGGCGCGTTGGACTGATGATGATCTGTACGGCATCATCCGTGCGGCTAAAAAAGGCAAAAAAACCTTCATTCTGCATGATGGCCCTCCTTATGCGAATGGCAGCATTCATATTGGTCACTCGGTTAACAAGATTCTGAAAGACATTATCATTAAGTCCAAAGGGCTTTCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCATGGTCTGCCAATCGAACTGAAAGTAGAGCAAGAATACGGTAAGCCGGGGGAGAAATTCACCGCCGCTGAGTTCCGCGCCAAGTGCCGCGAATACGCTGCGACCCAGGTTGACGGTCAGCGCAAAGACTTTATCCGTCTGGGCGTGCTGGGCGACTGGTCGCACCCGTACCTGACCATGGACTTCAAAACTGAAGCCAACATCATCCGCGCGCTGGGCAAAATCATCGGCAACGGTCACCTGCACAAAGGCGCGAAGCCGGTGCACTGGTGCGTTGACTGCCGTTCTGCACTGGCAGAAGCGGAAGTTGAGTATTACGACAAAACTTCTCCGTCCATCGACGTCGCTTTCCAGGCGGTCGATCAGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATGTTAACGGCCCAATTTCGCTGGTTATCTGGACCACCACGCCGTGGACGCTGCCTGCTAACCGCGCAATCTCCATTGCACCTGATTTTGATTATGCGCTGGTGCAAATCGACGGTCAGGCCGTGATCCTCGCGAAAGATCTGGTTGAAAGCGTAATGCAGCGTATCGGCGTTAGCGATTACACCATTCTTGGCACGGTGAAAGGTGCCGAGCTGGAACTGTTGCGCTTTACCCATCCGTTTATGGACTTCGATGTTCCGGCAATTCTCGGCGACCACGTTACGCTGGATGCCGGTACCGGTGCCGTTCATACCGCGCCAGGCCACGGTCCGGACGACTATGTGATCGGTCAAAAATATGGTCTGGAAACCGCTAACCCGGTTGGCCCGGACGGCACTTATCTGCCGGGTACTTACCCGACTCTGGATGGCGTTAACGTCTTCAAAGCGAACGATATTGTCATTGCGTTGTTGCAGGAAAAAGGCGCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTGCTGCTGGCGTCATAAAACGCCGATCATCTTCCGCGCGACGCCGCAGTGGTTCGTCAGCATGGATCAGAAAGGTCTGCGTGCGCAGTCACTGAAAGAGATCAAAGGCGTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATCTCTCGTCAGCGTACCTGGGGCGTGCCGATGTCACTGTTCGTGCACAAAGACACAGAAGAACTGCATCCGCGTACTCTCGAACTGATGGAAGAAGTGGCAAAACGCGTTGAAGTTGACGGCATTCAGGCGTGGTGGGATCTCGATGCGAAAGAGATCCTCGGCGACGAAGCTGACCAGTATGTGAAAGTACCGGATACGCTGGATGTATGGTTTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTCCGGAATTTGCCGGTCACGCAGCGGACATGTATCTGGAAGGTTCTGACCAACACCGTGGCTGGTTCATGTCTTCCCTGATGATCTCTACCGCGATGAAGGGCAAAGCGCCATATCGTCAGGTACTGACTCACGGCTTTACCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGTAACACCGTTTCGCCGCAGGATGTGATGAATAAACTGGGTGCGGATATTCTGCGTCTGTGGGTGGCATCAACCGACTACACTGGCGAAATGGCCGTTTCTGACGAGATCCTGAAACGTGCTGCCGACAGCTATCGTCGTATCCGTAACACCGCGCGCTTCCTGC
TGGCAAACCTGAACGGTTTTGATCCGGCAAAAGATATGGTGAAACCGGAAGAGATGGTGGTACTGGATCGCTGGGCCGTAGGTTGTGCGAAAGCGGCACAGGAAGACATCCTCAAGGCGTACGAAGCATACGATTTCCACGAAGTGGTACAGCGTCTGATGCGCTTCTGCTCCGTTGAGATGGGTTCCTTCTACCTCGACATCATCAAAGACCGTCAGTATACCGCCAAAGCGGACAGCGTGGCGCGTCGTAGCTGCCAGACTGCGCTGTATCACATCGCAGAAGCGCTGGTTCGCTGGATGGCACCAATCCTCTCCTTCACCGCTGATGAAGTGTGGGGTTACCTGCCGGGCGAACGTGAAAAATACGTCTTCACCGGCGAGTGGTACGAAGGCCTGTTTGGTCTGGCAGACAGTGAAGCAATGAACGATGCGTTCTGGGACGAGCTGTTGAAAGTGCGTGGCGAAGTGAACAAAGTCATTGAGCAAGCGCGTGCCGATAAGAACGTGGGCGGCTCGCTGGAAGCGGCAGTAACCTTGTATGCAGAACCGGAACTGGCGGCGAAACTGACCGCGCTGGGCGATGAATTACGATTTGTCCTGTTGACCTCCGGCGCTACCGTTGCAGACTATAACGACGCACCTGCTGATGCCCAGCAGAGCGAAGTCCTCAAAGGGCTGAAAGTCGCGTTGAGTAAAGCCGAAGGTGAGAAGTGTCCTCGCTGCTGGCACTACACCCAGGATGTCGGCAAGGTGGCGGAACACGCAGAAATCTGCGGCCGCTGTGTCAGCAACGTCGCCGGTGACGGTGAAAAACGTAAGTTTGCCTGA
Nuc. Counts: [660, 720, 817, 620]
Total Mass%: [24.1, 21.6, 33.4, 21.0] of 370216.6
Codons List: [ATG, AGT, GAC, TAT, AAA, TCA, ACC, CTG, AAT, TTG, CCG, GAA, ACA, GGG, TTC, CCG, ATG, CGT, GGC, GAT, CTC, GCC, AAG, CGC, GAA, CCG, GGA, ATG, CTG, GCG, CGT, TGG, ACT, GAT, GAT, GAT, CTG, TAC, GGC, ATC, ATC, CGT, GCG, GCT, AAA, AAA, GGC, AAA, AAA, ACC, TTC, ATT, CTG, CAT, GAT, GGC, CCT, CCT, TAT, GCG, AAT, GGC, AGC, ATT, CAT, ATT, GGT, CAC, TCG, GTT, AAC, AAG, ATT, CTG, AAA, GAC, ATT, ATC, ATT, AAG, TCC, AAA, GGG, CTT, TCT, GGA, TAT, GAC, TCG, CCG, TAT, GTG, CCT, GGC, TGG, GAC, TGT, CAT, GGT, CTG, CCA, ATC, GAA, CTG, AAA, GTA, GAG, CAA, GAA, TAC, GGT, AAG, CCG, GGG, GAG, AAA, TTC, ACC, GCC, GCT, GAG, TTC, CGC, GCC, AAG, TGC, CGC, GAA, TAC, GCT, GCG, ACC, CAG, GTT, GAC, GGT, CAG, CGC, AAA, GAC, TTT, ATC, CGT, CTG, GGC, GTG, CTG, GGC, GAC, TGG, TCG, CAC, CCG, TAC, CTG, ACC, ATG, GAC, TTC, AAA, ACT, GAA, GCC, AAC, ATC, ATC, CGC, GCG, CTG, GGC, AAA, ATC, ATC, GGC, AAC, GGT, CAC, CTG, CAC, AAA, GGC, GCG, AAG, CCG, GTG, CAC, TGG, TGC, GTT, GAC, TGC, CGT, TCT, GCA, CTG, GCA, GAA, GCG, GAA, GTT, GAG, TAT, TAC, GAC, AAA, ACT, TCT, CCG, TCC, ATC, GAC, GTC, GCT, TTC, CAG, GCG, GTC, GAT, CAG, GAT, GCG, CTG, AAA, ACG, AAA, TTT, GGC, GTA, AGC, AAT, GTT, AAC, GGC, CCA, ATT, TCG, CTG, GTT, ATC, TGG, ACC, ACC, ACG, CCG, TGG, ACG, CTG, CCT, GCT, AAC, CGC, GCA, ATC, TCC, ATT, GCA, CCT, GAT, TTT, GAT, TAT, GCG, CTG, GTG, CAA, ATC, GAC, GGT, CAG, GCC, GTG, ATC, CTC, GCG, AAA, GAT, CTG, GTT, GAA, AGC, GTA, ATG, CAG, CGT, ATC, GGC, GTT, AGC, GAT, TAC, ACC, ATT, CTT, GGC, ACG, GTG, AAA, GGT, GCC, GAG, CTG, GAA, CTG, TTG, CGC, TTT, ACC, CAT, CCG, TTT, ATG, GAC, TTC, GAT, GTT, CCG, GCA, ATT, CTC, GGC, GAC, CAC, GTT, ACG, CTG, GAT, GCC, GGT, ACC, GGT, GCC, GTT, CAT, ACC, GCG, CCA, GGC, CAC, GGT, CCG, GAC, GAC, TAT, GTG, ATC, GGT, CAA, AAA, TAT, GGT, CTG, GAA, ACC, GCT, AAC, CCG, GTT, GGC, CCG, GAC, GGC, ACT, TAT, CTG, CCG, GGT, ACT, TAC, CCG, ACT, CTG, GAT, GGC, GTT, AAC, GTC, TTC, AAA, GCG, AAC, GAT, ATT, GTC, ATT, GCG, TTG, TTG, CAG, GAA, AAA, GGC, GCA, CTG, TTG, CAC, GTT, GAG, 
AAA, ATG, CAA, CAC, AGC, TAT, CCG, TGC, TGC, TGG, CGT, CAT, AAA, ACG, CCG, ATC, ATC, TTC, CGC, GCG, ACG, CCG, CAG, TGG, TTC, GTC, AGC, ATG, GAT, CAG, AAA, GGT, CTG, CGT, GCG, CAG, TCA, CTG, AAA, GAG, ATC, AAA, GGC, GTG, CAG, TGG, ATC, CCT, GAC, TGG, GGC, CAG, GCG, CGT, ATC, GAG, TCG, ATG, GTT, GCT, AAC, CGT, CCT, GAC, TGG, TGT, ATC, TCT, CGT, CAG, CGT, ACC, TGG, GGC, GTG, CCG, ATG, TCA, CTG, TTC, GTG, CAC, AAA, GAC, ACA, GAA, GAA, CTG, CAT, CCG, CGT, ACT, CTC, GAA, CTG, ATG, GAA, GAA, GTG, GCA, AAA, CGC, GTT, GAA, GTT, GAC, GGC, ATT, CAG, GCG, TGG, TGG, GAT, CTC, GAT, GCG, AAA, GAG, ATC, CTC, GGC, GAC, GAA, GCT, GAC, CAG, TAT, GTG, AAA, GTA, CCG, GAT, ACG, CTG, GAT, GTA, TGG, TTT, GAC, TCC, GGA, TCT, ACC, CAC, TCT, TCC, GTT, GTT, GAT, GTG, CGT, CCG, GAA, TTT, GCC, GGT, CAC, GCA, GCG, GAC, ATG, TAT, CTG, GAA, GGT, TCT, GAC, CAA, CAC, CGT, GGC, TGG, TTC, ATG, TCT, TCC, CTG, ATG, ATC, TCT, ACC, GCG, ATG, AAG, GGC, AAA, GCG, CCA, TAT, CGT, CAG, GTA, CTG, ACT, CAC, GGC, TTT, ACC, GTG, GAT, GGT, CAG, GGT, CGC, AAG, ATG, TCT, AAA, TCC, ATC, GGT, AAC, ACC, GTT, TCG, CCG, CAG, GAT, GTG, ATG, AAT, AAA, CTG, GGT, GCG, GAT, ATT, CTG, CGT, CTG, TGG, GTG, GCA, TCA, ACC, GAC, TAC, ACT, GGC, GAA, ATG, GCC, GTT, TCT, GAC, GAG, ATC, CTG, AAA, CGT, GCT, GCC, GAC, AGC, TAT, CGT, CGT, ATC, CGT, AAC, ACC, GCG, CGC, TTC, CTG, CTG, GCA, AAC, CTG, AAC, GGT, TTT, GAT, CCG, GCA, AAA, GAT, ATG, GTG, AAA, CCG, GAA, GAG, ATG, GTG, GTA, CTG, GAT, CGC, TGG, GCC, GTA, GGT, TGT, GCG, AAA, GCG, GCA, CAG, GAA, GAC, ATC, CTC, AAG, GCG, TAC, GAA, GCA, TAC, GAT, TTC, CAC, GAA, GTG, GTA, CAG, CGT, CTG, ATG, CGC, TTC, TGC, TCC, GTT, GAG, ATG, GGT, TCC, TTC, TAC, CTC, GAC, ATC, ATC, AAA, GAC, CGT, CAG, TAT, ACC, GCC, AAA, GCG, GAC, AGC, GTG, GCG, CGT, CGT, AGC, TGC, CAG, ACT, GCG, CTG, TAT, CAC, ATC, GCA, GAA, GCG, CTG, GTT, CGC, TGG, ATG, GCA, CCA, ATC, CTC, TCC, TTC, ACC, GCT, GAT, GAA, GTG, TGG, GGT, TAC, CTG, CCG, GGC, GAA, CGT, GAA, AAA, TAC, GTC, TTC, ACC, GGC, GAG, TGG, TAC, GAA, GGC, CTG, TTT, GGT, 
CTG, GCA, GAC, AGT, GAA, GCA, ATG, AAC, GAT, GCG, TTC, TGG, GAC, GAG, CTG, TTG, AAA, GTG, CGT, GGC, GAA, GTG, AAC, AAA, GTC, ATT, GAG, CAA, GCG, CGT, GCC, GAT, AAG, AAC, GTG, GGC, GGC, TCG, CTG, GAA, GCG, GCA, GTA, ACC, TTG, TAT, GCA, GAA, CCG, GAA, CTG, GCG, GCG, AAA, CTG, ACC, GCG, CTG, GGC, GAT, GAA, TTA, CGA, TTT, GTC, CTG, TTG, ACC, TCC, GGC, GCT, ACC, GTT, GCA, GAC, TAT, AAC, GAC, GCA, CCT, GCT, GAT, GCC, CAG, CAG, AGC, GAA, GTC, CTC, AAA, GGG, CTG, AAA, GTC, GCG, TTG, AGT, AAA, GCC, GAA, GGT, GAG, AAG, TGT, CCT, CGC, TGC, TGG, CAC, TAC, ACC, CAG, GAT, GTC, GGC, AAG, GTG, GCG, GAA, CAC, GCA, GAA, ATC, TGC, GGC, CGC, TGT, GTC, AGC, AAC, GTC, GCC, GGT, GAC, GGT, GAA, AAA, CGT, AAG, TTT, GCC, TGA]
Is Protein?: YES
Region Name: Non-protein region
Nucleotides: GCTTGCGCCAACGCCATTTCATCGCCATCCCGCCGAGCATACAGGCCTCGGAAGAACCAATGGTGTTGGTGCCAACGGCCTGACCATTTTTCGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGCAGATTGCGGATATTCTTCTTTGTCGATCCAGTTTTTGTTAATGGATAAATCCA
Nuc. Counts: [46, 56, 49, 53]
Total Mass%: [23.5, 23.5, 28.0, 25.0] of 26473.6
Codons List: [GCT, TGC, GCC, AAC, GCC, ATT, TCA, TCG, CCA, TCC, CGC, CGA, GCA, TAC, AGG, CCT, CGG, AAG, AAC, CAA, TGG, TGT, TGG, TGC, CAA, CGG, CCT, GAC, CAT, TTT, TCG, GTG, CAG, GCG, CAT, GCC, ACA, GAT, CGG, CAA, CCA, TGT, TTA, CGC, AAC, GCA, GAT, CGA, TTG, CTG, CAG, ATT, GCG, GAT, ATT, CTT, CTT, TGT, CGA, TCC, AGT, TTT, TGT, TAA, TGG, ATA, AAT, CCA]
Is Protein?: NO
Region Name: FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase
Nucleotides: ATGTCTGAATCTGTACAGAGCAATAGCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGATGGCACCACCGCTGAGTCTACCCGCAACAACGGTAAACCGGCGCTGTTCCGCCTGGGTGATGCTTCTCTTTCTGAAGGGCTGGAGCAACACCTGCTGGGGCTGAAAGTGGGCGATAAAACCACCTTCTCGCTGGAGCCAGATGCGGCGTTTGGCGTGCCGTCACCGGACCTGATTCAGTACTTCTCCCGCCGTGAATTTATGGATGCAGGCGAGCCAGAAATTGGCGCAATCATGCTTTTTACCGCAATGGATGGCAGTGAGATGCCTGGCGTGATCCGCGAAATTAACGGCGACTCCATTACCGTTGATTTCAACCATCCGCTGGCCGGGCAGACCGTTCATTTTGATATTGAAGTGCTGGAAATCGATCCGGCACTGGAGGCGTAA
Nuc. Counts: [100, 121, 125, 104]
Total Mass%: [23.0, 22.8, 32.1, 22.1] of 58858.4
Codons List: [ATG, TCT, GAA, TCT, GTA, CAG, AGC, AAT, AGC, GCC, GTC, CTG, GTG, CAC, TTC, ACG, CTA, AAA, CTC, GAC, GAT, GGC, ACC, ACC, GCT, GAG, TCT, ACC, CGC, AAC, AAC, GGT, AAA, CCG, GCG, CTG, TTC, CGC, CTG, GGT, GAT, GCT, TCT, CTT, TCT, GAA, GGG, CTG, GAG, CAA, CAC, CTG, CTG, GGG, CTG, AAA, GTG, GGC, GAT, AAA, ACC, ACC, TTC, TCG, CTG, GAG, CCA, GAT, GCG, GCG, TTT, GGC, GTG, CCG, TCA, CCG, GAC, CTG, ATT, CAG, TAC, TTC, TCC, CGC, CGT, GAA, TTT, ATG, GAT, GCA, GGC, GAG, CCA, GAA, ATT, GGC, GCA, ATC, ATG, CTT, TTT, ACC, GCA, ATG, GAT, GGC, AGT, GAG, ATG, CCT, GGC, GTG, ATC, CGC, GAA, ATT, AAC, GGC, GAC, TCC, ATT, ACC, GTT, GAT, TTC, AAC, CAT, CCG, CTG, GCC, GGG, CAG, ACC, GTT, CAT, TTT, GAT, ATT, GAA, GTG, CTG, GAA, ATC, GAT, CCG, GCA, CTG, GAG, GCG, TAA]
Is Protein?: YES

BIN
dna/spec/spec.pdf Normal file

Binary file not shown.