parent
9e458e8709
commit
7b04c359f4
14
README.md
14
README.md
|
@ -1,10 +1,8 @@
|
||||||
# Topics:
|
# Introduction to Programming in Java
|
||||||
File I/o (input / output), Arrays
|
|
||||||
|
|
||||||
## Learning Outcomes:
|
## Contents
|
||||||
|
|
||||||
- Practice Reading in files to java and processing file text content
|
**Projects**
|
||||||
- Become comfortable with using arrays to store and retrieve data
|
|
||||||
- Design and develop programs in accepted style
|
- Calendar
|
||||||
- Develop further the ability to enhance a program to increase functionality
|
- DNA
|
||||||
- Execute the proper steps to write out desired content to a file
|
|
||||||
|
|
|
@ -0,0 +1,10 @@
|
||||||
|
# Topics:
|
||||||
|
File I/O (input / output), Arrays
|
||||||
|
|
||||||
|
## Learning Outcomes:
|
||||||
|
|
||||||
|
- Practice reading files into Java and processing their text content
|
||||||
|
- Become comfortable with using arrays to store and retrieve data
|
||||||
|
- Design and develop programs in accepted style
|
||||||
|
- Develop further the ability to enhance a program to increase functionality
|
||||||
|
- Execute the proper steps to write out desired content to a file
|
|
@ -0,0 +1,332 @@
|
||||||
|
import java.util.*;
|
||||||
|
import java.io.*;
|
||||||
|
import java.text.*;
|
||||||
|
|
||||||
|
/**
 * Reports information about DNA nucleotide sequences that may encode proteins.
 *
 * <p>The input file consists of line pairs: a region name followed by its
 * nucleotide sequence. For every pair the program writes the nucleotide
 * counts, mass percentages, codon list and a protein verdict to the output file.
 *
 * <p>All per-nucleotide arrays in this class use the order A, C, G, T
 * (followed by the junk character '-' where junk is included).
 */
public class DNA {

    /** Minimum number of codons a valid protein must have. */
    static final int MIN_CODONS = 5;

    /** Minimum percentage of total mass that C and G together must reach for a valid protein. */
    static final int MIN_MASS_PERCENT = 30;

    /** Number of unique nucleotides (A, C, G and T). */
    static final int UNIQUE_NUCLEOTIDES = 4;

    /** Number of nucleotides per codon (the name is historical and kept for compatibility). */
    public static final int CODONS_PER_NUCLEOTIDE = 3;

    /** Directory prefix prepended to the input file name. */
    public static final String INPUT_DIR = "input/";

    /** Directory prefix prepended to the output file name. */
    public static final String OUTPUT_DIR = "output/";

    /** When true, the file name prompts are skipped and fixed debug file names are used. */
    public static final boolean DEBUG = false;

    /** Molar masses (grams/mol) in A, C, G, T, junk order. */
    public static final double[] MOLAR_MASSES = {135.128, 111.103, 151.128, 125.107, 100.00};

    /** Nucleotide characters in the same A, C, G, T, junk order as {@link #MOLAR_MASSES}. */
    public static final char[] NUCLEOTIDES = {'A', 'C', 'G', 'T', '-'};

    /**
     * Begins with an introduction and prompts for input and output file names,
     * reads the input file to collect its name/sequence line pairs, and writes
     * the report for every pair to the output file.
     *
     * @param args unused
     * @throws FileNotFoundException if the input or output file cannot be opened
     */
    public static void main(String[] args) throws FileNotFoundException {
        Scanner console = new Scanner(System.in);
        String[] files = promptForFileNames(console);
        File inFile = new File(INPUT_DIR + files[0]);
        File outFile = new File(OUTPUT_DIR + files[1]);

        if (!inFile.isFile() || !inFile.canRead()) {
            // Report the problem instead of silently producing no output.
            System.out.println("Cannot read input file: " + inFile.getPath());
            return;
        }

        List<String> names = new ArrayList<>();
        List<String> sequences = new ArrayList<>();
        try (Scanner input = new Scanner(inFile)) {
            while (input.hasNextLine()) {
                String name = input.nextLine();
                if (!input.hasNextLine()) {
                    break; // dangling name without a sequence line: ignore it
                }
                names.add(name);
                // Sequences are reported in uppercase; ROOT avoids locale-specific case mapping.
                sequences.add(input.nextLine().toUpperCase(Locale.ROOT));
            }
        }

        // try-with-resources guarantees the output file is flushed and closed.
        try (PrintStream output = new PrintStream(outFile)) {
            saveOutput(sequences.toArray(new String[0]), names.toArray(new String[0]), output);
        }
    }

    /**
     * Writes the report for every sequence to the given stream.
     * Nucleotide counts and mass percentages are shown in A, C, G, T order.
     *
     * @param sequences nucleotide sequences, one per region
     * @param names     region names, parallel to {@code sequences}
     * @param output    stream that receives the report
     */
    public static void saveOutput(String[] sequences, String[] names, PrintStream output) {
        for (int i = 0; i < sequences.length; i++) {
            String sequence = sequences[i];
            output.println("Region Name: " + names[i]);
            output.println("Nucleotides: " + sequence);
            output.println("Nuc. Counts: " + Arrays.toString(nucleotideCountFromSequence(sequence)));
            output.println("Total Mass%: "
                    + Arrays.toString(nucleotideMassPercentFromSequence(sequence))
                    + " of " + totalMassFromSequence(sequence));
            output.println("Codons List: " + Arrays.toString(codonsFromSequence(sequence)));
            output.println("Is Protein?: " + (isProtein(sequence) ? "YES" : "NO"));
            output.println();
        }
    }

    /**
     * Tests whether a sequence is a protein-coding gene: it has at least
     * {@link #MIN_CODONS} codons, starts with ATG, ends with TAA, TAG or TGA,
     * and C plus G account for at least {@link #MIN_MASS_PERCENT} percent of
     * its total mass (junk included in the total).
     *
     * @param sequence nucleotide sequence, any case, may contain junk '-'
     * @return true if every condition holds
     */
    public static boolean isProtein(String sequence) {
        String[] codons = codonsFromSequence(sequence);
        // Check the length first so that short or empty sequences never index codons[0].
        if (codons.length < MIN_CODONS) {
            return false;
        }
        if (!"ATG".equalsIgnoreCase(codons[0])) {
            return false;
        }
        String last = codons[codons.length - 1];
        boolean endsWithStop = "TAA".equalsIgnoreCase(last)
                || "TAG".equalsIgnoreCase(last)
                || "TGA".equalsIgnoreCase(last);
        if (!endsWithStop) {
            return false;
        }
        double[] masses = rawMasses(sequence);
        double total = 0.0;
        for (double mass : masses) {
            total += mass;
        }
        double cgMass = masses[nucleotideIndexFromChar('C')] + masses[nucleotideIndexFromChar('G')];
        // "At least" the threshold: exactly MIN_MASS_PERCENT qualifies.
        return cgMass / total * 100.0 >= MIN_MASS_PERCENT;
    }

    /**
     * Computes the mass contributed by each non-junk nucleotide.
     *
     * @param sequence nucleotide sequence, any case, may contain junk '-'
     * @return masses in A, C, G, T order, each rounded to two decimals
     */
    public static double[] nucleotideMassesFromSequence(String sequence) {
        double[] raw = rawMasses(sequence);
        double[] masses = new double[UNIQUE_NUCLEOTIDES];
        for (int i = 0; i < masses.length; i++) {
            masses[i] = round(raw[i], 2);
        }
        return masses;
    }

    /**
     * Computes the percentage of the total mass (junk included) contributed
     * by each non-junk nucleotide.
     *
     * @param sequence nucleotide sequence, any case, may contain junk '-'
     * @return percentages in A, C, G, T order, each rounded to one decimal;
     *         all zeros when the sequence has no mass
     */
    public static double[] nucleotideMassPercentFromSequence(String sequence) {
        double[] raw = rawMasses(sequence);
        double total = 0.0;
        for (double mass : raw) {
            total += mass;
        }
        double[] percentages = new double[UNIQUE_NUCLEOTIDES];
        if (total == 0.0) {
            return percentages; // avoid 0/0 = NaN for empty input
        }
        for (int i = 0; i < percentages.length; i++) {
            percentages[i] = round(raw[i] / total * 100.0, 1);
        }
        return percentages;
    }

    /**
     * Computes the total mass of a sequence, junk included.
     *
     * @param sequence nucleotide sequence, any case, may contain junk '-'
     * @return total mass rounded to one decimal
     */
    public static double totalMassFromSequence(String sequence) {
        double total = 0.0;
        // Sum the unrounded parts and round once, so rounding errors do not accumulate.
        for (double mass : rawMasses(sequence)) {
            total += mass;
        }
        return round(total, 1);
    }

    /**
     * Counts the exact (case-sensitive) occurrences of a character in a sequence.
     *
     * @param sequence   text to scan
     * @param nucleotide character to count
     * @return number of positions holding {@code nucleotide}
     */
    public static int nucleotideCount(String sequence, char nucleotide) {
        int count = 0;
        for (char c : sequence.toCharArray()) {
            if (c == nucleotide) {
                count++;
            }
        }
        return count;
    }

    /**
     * Converts a nucleotide character to its molar mass (grams/mol):
     * A 135.128, C 111.103, G 151.128, T 125.107, junk '-' 100.000.
     *
     * @param nucleotide nucleotide character, any case, or '-'
     * @return the unrounded molar mass from {@link #MOLAR_MASSES}
     * @throws IllegalArgumentException if the character is not A, C, G, T or '-'
     */
    public static double nucleotideToMolarMass(char nucleotide) {
        int index = nucleotideIndexFromChar(nucleotide);
        if (index < 0) {
            throw new IllegalArgumentException("Unknown nucleotide: " + nucleotide);
        }
        return MOLAR_MASSES[index];
    }

    /**
     * Counts the number of As, Cs, Gs and Ts in a sequence. Junk and any
     * unrecognised characters are skipped.
     *
     * @param sequence nucleotide sequence, any case, may contain junk '-'
     * @return counts array of size 4 in A, C, G, T order
     */
    public static int[] nucleotideCountFromSequence(String sequence) {
        return Arrays.copyOf(countsWithJunk(sequence), UNIQUE_NUCLEOTIDES);
    }

    /**
     * Converts a single character into its array index:
     * A = 0, C = 1, G = 2, T = 3 (case-insensitive) and junk '-' = 4.
     *
     * @param nucleotide character to map
     * @return the index, or -1 if the character is not a nucleotide or junk
     */
    public static int nucleotideIndexFromChar(char nucleotide) {
        switch (Character.toUpperCase(nucleotide)) {
            case 'A':
                return 0;
            case 'C':
                return 1;
            case 'G':
                return 2;
            case 'T':
                return 3;
            case '-':
                return 4;
            default:
                return -1;
        }
    }

    /**
     * Eliminates the junk characters from a sequence.
     *
     * @param sequence raw sequence
     * @return the sequence without junk DNA '-'
     */
    public static String removeJunk(String sequence) {
        return sequence.replace("-", "");
    }

    /**
     * Breaks a sequence apart into codons of {@link #CODONS_PER_NUCLEOTIDE}
     * nucleotides each. Junk is removed first; trailing nucleotides that do
     * not fill a whole codon are dropped. Case is preserved.
     *
     * @param sequence nucleotide sequence, with or without junk
     * @return array of codon strings in sequence order
     */
    public static String[] codonsFromSequence(String sequence) {
        String clean = removeJunk(sequence);
        String[] codons = new String[clean.length() / CODONS_PER_NUCLEOTIDE];
        for (int i = 0; i < codons.length; i++) {
            int start = i * CODONS_PER_NUCLEOTIDE;
            codons[i] = clean.substring(start, start + CODONS_PER_NUCLEOTIDE);
        }
        return codons;
    }

    /**
     * Prints the introduction and prompts for the input and output file names.
     * In {@link #DEBUG} mode no prompt is shown and fixed names are returned.
     *
     * @param console scanner the answers are read from
     * @return array holding the input file name at index 0 and the output file name at index 1
     */
    public static String[] promptForFileNames(Scanner console) {
        System.out.println("This program reports information about DNA");
        System.out.println("nucleotide sequences that may encode");
        System.out.println("proteins.");

        if (DEBUG) {
            return new String[] {"dna.txt", "dna.txt"};
        }

        String[] files = new String[2];
        files[0] = promptForFileName(console, "Input file name? ");
        files[1] = promptForFileName(console, "Output file name? ");
        System.out.println();
        return files;
    }

    /**
     * Counts the lines in a file.
     *
     * @param file file to scan
     * @return number of lines (0 for an empty file)
     * @throws FileNotFoundException if the file cannot be opened
     */
    public static int linesInFile(File file) throws FileNotFoundException {
        int count = 0;
        try (Scanner input = new Scanner(file)) {
            while (input.hasNextLine()) {
                input.nextLine();
                count++;
            }
        }
        return count;
    }

    /**
     * Checks that a file name was actually supplied.
     *
     * @param name file name typed by the user
     * @return false for null or blank names, true otherwise
     */
    public static boolean validFilename(String name) {
        return name != null && !name.trim().isEmpty();
    }

    /** Repeats one prompt until {@link #validFilename(String)} accepts the answer. */
    private static String promptForFileName(Scanner console, String prompt) {
        System.out.print(prompt);
        String name = console.nextLine();
        while (!validFilename(name)) {
            System.out.println("Invalid. Try again.");
            System.out.print(prompt);
            name = console.nextLine();
        }
        return name;
    }

    /** Counts A, C, G, T and junk (in that order), skipping unrecognised characters. */
    private static int[] countsWithJunk(String sequence) {
        int[] counts = new int[MOLAR_MASSES.length];
        for (int i = 0; i < sequence.length(); i++) {
            int index = nucleotideIndexFromChar(sequence.charAt(i));
            if (index >= 0) {
                counts[index]++;
            }
        }
        return counts;
    }

    /** Unrounded mass per category in A, C, G, T, junk order. */
    private static double[] rawMasses(String sequence) {
        int[] counts = countsWithJunk(sequence);
        double[] masses = new double[counts.length];
        for (int i = 0; i < masses.length; i++) {
            masses[i] = counts[i] * MOLAR_MASSES[i];
        }
        return masses;
    }

    /** Rounds half-up to the given number of decimal places, independent of the default locale. */
    private static double round(double value, int places) {
        double scale = Math.pow(10, places);
        return Math.round(value * scale) / scale;
    }
}
|
|
@ -0,0 +1,214 @@
|
||||||
|
# Topics:
|
||||||
|
DNA.java focuses on arrays and file/text processing.
|
||||||
|
DNA requires the two input files dna.txt and ecoli.txt.
|
||||||
|
These files are saved in the spec/ folder. This can be changed with INPUT\_PATH.
|
||||||
|
DNA processes input files, parses the genomic information, and saves the output in a new file.
|
||||||
|
|
||||||
|
## Learning Outcomes:
|
||||||
|
|
||||||
|
|
||||||
|
# Background
|
||||||
|
DNA consists of long chains of chemical compounds called nucleotides.
|
||||||
|
Four nucleotides are present in DNA: Adenine (A), Cytosine (C), Guanine (G), and Thymine (T).
|
||||||
|
These are organized into subunits called "codons".
|
||||||
|
Most genes contain codons for building proteins; some do not.
|
||||||
|
Each codon (e.g. TAC GGA) uniquely encodes a single amino acid, a building block of proteins.
|
||||||
|
The sequences of DNA that encode proteins occur between a start codon (which we will assume to be ATG) and a stop codon (which is any of TAA, TAG, or TGA).
|
||||||
|
Not all regions of DNA are genes; large portions that do not lie between a valid start codon and a stop codon do not encode proteins.
|
||||||
|
Start: ATG.
|
||||||
|
Stop: TAA, TAG, TGA.
|
||||||
|
Often high percentages of Cytosine (C) and Guanine (G) are indicators of important genetic data.
|
||||||
|
|
||||||
|
|
||||||
|
# Input
|
||||||
|
- The DNA input data consists of line pairs.
|
||||||
|
- The input file exists, is readable, and contains valid input.
|
||||||
|
- The first line has the name of the nucleotide sequence.
|
||||||
|
- The second is the nucleotide sequence itself.
|
||||||
|
- Each character in a sequence of nucleotides will be A, C, G, T, or a dash character, "-", either upper or lowercase.
|
||||||
|
- You may assume that each sequence's number of nucleotides (without dashes) will be a multiple of 3.
|
||||||
|
|
||||||
|
## Example
|
||||||
|
|
||||||
|
> cure for cancer protein
|
||||||
|
> ATGCCACTATGGTAG
|
||||||
|
> captain picard hair growth protein
|
||||||
|
> ATgCCAACATGgATGCCcGATAtGGATTgA
|
||||||
|
> bogus protein
|
||||||
|
> CCATt-AATgATCa-CAGTt
|
||||||
|
> ...
|
||||||
|
|
||||||
|
# Process:
|
||||||
|
- from the original nucleotide sequence string to nucleotide counts.
|
||||||
|
- from nucleotide counts to mass percentages.
|
||||||
|
- from the original nucleotide sequence string to codon triplets.
|
||||||
|
|
||||||
|
# Output:
|
||||||
|
|
||||||
|
For each nucleotide sequence:
|
||||||
|
- nucleotide counts
|
||||||
|
- Counts the occurrences of each of the four nucleotides ['A', 'C', 'G', 'T'].
|
||||||
|
- mass percentages
|
||||||
|
- Calculates the mass percentage occupied by each nucleotide type, rounded to one digit past the decimal point.
|
||||||
|
- codons
|
||||||
|
- Reports the codons (e.g. TAG) present in each sequence.
|
||||||
|
- protein-coding gene
|
||||||
|
- begins with a valid start codon ["ATG"]
|
||||||
|
- ends with a valid stop codon ["TAA", "TAG", or "TGA"]
|
||||||
|
- contains at least 5 total codons (including its initial start codon and final stop codon)
|
||||||
|
- Cytosine (C) and Guanine (G) combined account for at least 30% of its total mass
|
||||||
|
|
||||||
|
## Example
|
||||||
|
|
||||||
|
> This program reports information about DNA
|
||||||
|
> nucleotide sequences that may encode
|
||||||
|
> proteins. Input file name? dna.txt
|
||||||
|
> Output file name? output.txt
|
||||||
|
> Output file output.txt after above execution (partial):
|
||||||
|
> Region Name: cure for cancer protein
|
||||||
|
> Nucleotides: ATGCCACTATGGTAG
|
||||||
|
> Nuc. Counts: [4, 3, 4, 4]
|
||||||
|
> Total Mass%: [27.3, 16.8, 30.6, 25.3] of 1978.8
|
||||||
|
> Codons List: [ATG, CCA, CTA, TGG, TAG]
|
||||||
|
> Is Protein?: YES
|
||||||
|
> ...
|
||||||
|
|
||||||
|
# Approach
|
||||||
|
|
||||||
|
## Constants
|
||||||
|
|
||||||
|
```java
|
||||||
|
int MIN_CODONS = 5; //the minimum number of codons a valid protein must have
|
||||||
|
int MIN_MASS_PERCENT = 30; // the percentage of mass from C and G in order for a protein to be valid
|
||||||
|
int UNIQUE_NUCLEOTIDES = 4; // the number of unique nucleotides (representing A, C, G, and T)
|
||||||
|
int CODONS_PER_NUCLEAOTIDE = 3; // the number of nucleotides per codon
|
||||||
|
```
|
||||||
|
|
||||||
|
```java
|
||||||
|
/*
|
||||||
|
*
|
||||||
|
* begins with an introduction and prompts for input and output file names.
|
||||||
|
* reads the input file to process its nucleotide sequences.
|
||||||
|
* outputs the results into the given output file.
|
||||||
|
*
|
||||||
|
* @return void
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public static void main(String[] args) {
|
||||||
|
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
```java
|
||||||
|
/*
|
||||||
|
*
|
||||||
|
* assumes the user will type the name of an existing input file.
|
||||||
|
* input is in the proper format.
|
||||||
|
*
|
||||||
|
* @params console
|
||||||
|
* @return files array of input and output files for processing and saving
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public static String[] promptForFileNames(Scanner console) {
|
||||||
|
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
```java
|
||||||
|
/*
|
||||||
|
*
|
||||||
|
* Converts char nucleotide to molar mass
|
||||||
|
*
|
||||||
|
* mass percentages, use the following as the mass of each nucleotide (grams/mol).
|
||||||
|
* "junk" regions are excluded from many parts of your computations, but they do contribute mass to the total.
|
||||||
|
* Adenine (A): 135.128
|
||||||
|
* Cytosine (C): 111.103
|
||||||
|
* Guanine (G): 151.128
|
||||||
|
* Thymine (T): 125.107
|
||||||
|
* Junk (-): 100.000
|
||||||
|
*
|
||||||
|
* @params nucleotide char of nucleotide.
|
||||||
|
* @return molarMass rounded to nearest tenth.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public static double nucleotideToMolarMass(char nucleotide) {
|
||||||
|
double[] masses = {135.128, 111.103, 151.128, 125.107};
|
||||||
|
double rounded = Math.round(mass * 10.0) / 10.0;
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
```java
|
||||||
|
/*
|
||||||
|
*
|
||||||
|
* Next, write code to pass over a nucleotide sequence and count the number of As, Cs, Gs, and Ts.
|
||||||
|
* use a String's charAt method to get individual characters.
|
||||||
|
*
|
||||||
|
* @params sequence sequence of
|
||||||
|
* @return counts array of size 4.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public static int[] nucleotideCountFromSequence(String sequence) {
|
||||||
|
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
```java
|
||||||
|
/*
|
||||||
|
*
|
||||||
|
* converts a single character (i.e. A, C, T, G) into indices (i.e. 0 to 3).
|
||||||
|
*
|
||||||
|
* @params nucleotide char of nucleotide.
|
||||||
|
* @return index int mapping of nucleotide.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public static int nucleotideIndexFromChar(char nucleotide) {
|
||||||
|
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
```java
|
||||||
|
/*
|
||||||
|
*
|
||||||
|
* eliminate these characters.
|
||||||
|
*
|
||||||
|
* @params sequence raw sequence
|
||||||
|
* @return sequence without junk DNA '-'.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public static String nucleotidesOnlyFromSequence(String sequence) {
|
||||||
|
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
```java
|
||||||
|
/*
|
||||||
|
*
|
||||||
|
* break apart the sequence into codons and examine each codon.
|
||||||
|
*
|
||||||
|
* @params sequence String of nucleotides or raw.
|
||||||
|
* @return codons Array of strings of codons.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public static String[] codonsFromSequence(String sequence) {
|
||||||
|
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
```java
|
||||||
|
/*
|
||||||
|
*
|
||||||
|
* Saves output to file using PrintStream as described in Section 6.4 of the textbook.
|
||||||
|
* overwrites any existing data in the output file (this is the default PrintStream behavior).
|
||||||
|
* nucleotide sequence is output in uppercase
|
||||||
|
* the nucleotide counts and mass percentages are shown in A, C, G, T order.
|
||||||
|
*
|
||||||
|
* @params path String path of output filename
|
||||||
|
* @return void;
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
public static void saveOutput(String path) {
|
||||||
|
|
||||||
|
}
|
||||||
|
```
|
|
@ -0,0 +1,18 @@
|
||||||
|
cure for cancer protein
|
||||||
|
ATGCCACTATGGTAG
|
||||||
|
captain picard hair growth protein
|
||||||
|
ATgCCAACATGgATGCCcGATAtGGATTgA
|
||||||
|
bogus protein
|
||||||
|
CCATtAATgATCaCAGTt
|
||||||
|
michael jordan mad hops protein
|
||||||
|
ATgAGATCCgtgatGTGggaTCCTaCTCATTaa
|
||||||
|
paris hilton phony protein
|
||||||
|
AtgCCaacaTGGATGCCCTAAGATAtgGATTagtgA
|
||||||
|
george w bush approval rating protein
|
||||||
|
atgataattagttttaatatcagactgtaa
|
||||||
|
jimi hendrix guitar talent protein
|
||||||
|
ATGCAATTGCTCGATTAG
|
||||||
|
tyler durden's brain protein
|
||||||
|
ATGATAcctatgagtaaTGTGGACCatatccaaACTATAGGCATtgtcggACCAACGATcgattggtTATACTGA
|
||||||
|
mini me growth hormone
|
||||||
|
AtGgGaCGCTgA
|
|
@ -0,0 +1,40 @@
|
||||||
|
thr operon leader peptide
|
||||||
|
ATGAAACGCATTAGCaCCAcCATtACCACCaCCATCaCcATTACCACAGGTAACGGTGCGGGCTGA
|
||||||
|
aspartokinase I/homoserine dehydrogenase I
|
||||||
|
ATGCGAGtGTTGAAGTTcgGCGGTaCATCAgTGGCAAATGCAGAACGTtTTCTGCGGgTTGCCGATAttCTGGAAAGcAATGCCAGGCAGGGGCAGgTGGcCACCGTCCTCtCTGcCCCCGCCAAAATCACCAACCATCtGGTaGCGATGATtGaaAAaACCATtAGCGGTCAGGAtGCtTTaCcCaATATCAGCGATGCCGAACGTATTTTTGCCGAACTtCTGACgGGACTCGCCGCcGCCCAGcCGGGATTTCCGCTGGCACAAtTgAAAAcTTTCGTCGACCAgGAATTTGCCCAAATAAAACATGTcCtGCATGGCatCAGTTTGTTGGGGCAGTGCCCGGaTAGCATcAACGCTGCGCTGATTTGcCGTGgCGAGAAAaTGTcGaTcgCCattaTGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGgTCGAAaAAcTGCTgGCAGTGGGTCATTAcCtCgAaTCTACCGTTGATaTtGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCgGCTGACCACATgGtGCTGATGGCTGGTTTCACTGcCggTAATGAAAAAGgCGaGCTGGtGGTtCTGGGAcGCAACGGTTCCGACTaCTCCGCTGCGGTgCTGGCGGCcTGTTTaCGCGCCGATTGTTGcGAgaTCTGGACGGATGTTGAcGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGgAaGCGATGGAGCTTTCTTACTTCGGCGCTAAAgTTCTTCaCCCcCGCACCATTACCCCCATcGCCCAGtTCCAGATcCCTtgCCtGATTAAAAATAcCGgAAAtCCCCAAGCACCAGgTACGCtCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATcTGAATaACATGGCAATgTTCAGcGTTTCCGgCCCGGGGAtGAAAGGgATggTTgGCATGGCGGCGCGcgTCTTTGCAGcGaTGTCACGCGCCCGTaTTtCCGTGGTgCtGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCaAAGCGACTGTGTGCGAGCTgAaCGGGCAaTGcAGGAAGAGtTCTACCTGGAaCTGaAAGAAGGCTTACTGGAGCcGTTGGCgGtGACGGAACGGCTGGCCATTATCTcGGTGgTAGGTGATGGTATGCGcACCTtaCGTGGGAtCTCGgCGAAATtCTtTGCCGCGCTgGCcCGCGCCAATATCAACATTGTCgCCATTGCtCaGGGaTCTTcTGAaCGCTCAAtCTCTGTcGTGGTcAaTAACGATgATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGgCGTCGGTGGCGTTGgcGGTGCGCTGCTGgAGCAACTGAAGCGTCAgCAAAGCTGGTTGAAGAATAAaCATATCGaCTTACGTGTCTGCGGTGTTGCTAACTCGAAGgCACtgCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGgAAGAACTGGCGCAAGCcAAAGAGCCGTTTAATCTCGgGCGcTtAATTCGCCTCGTGAAAGAATATCATCTGCtGAaCCCGGTCATTgTTGACTgTACTTCCAgCCAGGCTGTgGCAGaTCAATATgCCGACTtCCTgCGCGAAGGTTTCCAcGTTGTtACGCCGAaCAAAaAGGCCaACACCTCGTcgATGGaTTACTaCCATCAGTtGCGTTATGCGGCGGAAAAATCGCGGCGTAaATTCCTCtATGACACcaACGTtGGGGCTGGATTACCGGTTATTgAGAACCTGCAAAATCTGCTCAATGCtGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTAtATCTTCGGCAAGTTAGACGAAGGCaTGAGTtTCTCCGAGgCGACCaCACTGGCGCGGGAAATGgGTTATACCGA
ACCGGAcCcGCGAGATGATCTTtCtGGTATGgAtGTGGCGCgTAagCTAtTGATtCTCGCTCGTGAAACGGGACGTGAACTGGAGCtGGCGGATATTGAAATTGAACCTgTGCTGCCCGCaGaGTTTAACGCCGAGGGTGATGTCGCcGCTTTTATGGCGAATCTGTCACAGCTCGACGaTCtCTTTGCCGCGCGTGTgGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATAttGATGAAGATgGCgTCTGCCGCGTGAAGaTTGCCGAAGTGGATGgTAATGaTCCGCTGTTCAAAGTGAaAaATGGCGaAAACGCCCTGGCCTTCTATAGCCACTATtATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCaATgACGTTaCAGCTGCCGGTgTCTTTGCTGATCTGCTACGtACCCTcTCAtGGaAGTTAGGAGTCTGA
|
||||||
|
homoserine kinase
|
||||||
|
ATgGTTAAAgTTTAtGCCCCGGCtTCCAGTGCCaATATGaGcGTCGgGTTTGATGTGCTCGGGgCGGCGGTGACACCTGTTGATGGTGCATTGCTCGgAGaTGTagTcaCGGTTGAGGCGGCAGAGACaTTCAgTCTCAACAACCTCGGACGCTTTGCCGAtAAGCTGCCGTCAGAGCCACGgGaaAATAtCGTTtATcAGTGcTGGGAGCGTtTTTGcCaGGAGCTTGGCAAGCAAATTCCAGTGGCGATGaCTCTGGAAAAGAATatGCCGAtCgGTTCGGGcTTAGGCTcCAGCGCCtGTTCAGTGGTCGCGGCgCTgAtGGCGATgAATGAAcACTGCGGCaAGCCGCTTAATGACACTCGTTTGCTGGCTTtGATGGgCGAgTTGGAAGGGcGTATCTCCGGCAGCAtTCATTACGACAACGtGGCACCGTGtTtTCtTGGTGGTAtGCAGTtgATGATCGAAGAaAACGACATCATCAGCCAGCAaGTGCCAGGGTTTGATGAGtGGCTGTGGGTGCTGGCGTATcCGGgGAtTAAAGTCtCGaCGGcAGAAGCCAGGGCTaTTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCAcGGGCgACATCTgGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATgAAAGaTGTTATCGCTGAACCCTACcGTGaACgGTTaCTGCCAGGCTTCCGGCAGGCGCGGcAGgCGGTTGCGGAAATCGGCGCGGTAgCGAGCGGTATCTCCGGCTCCGGCCCGAcTtTGTTCGCTCTGTGtGAcAAGCCGGATACCGCCCAGCGCGTTGCCGACTGgTTGGGTAAGAACtAcCTGCAAAATCAGgAAGGTTTTGTTcATATTTGCCGGCTGGATACGGCGGGcGCACGAgTACTGGAAAACTAA
|
||||||
|
threonine synthase
|
||||||
|
ATGAAACTCtacaATCTGAAAGATCACAATGAGCAGgTCaGCTTTGCGCAAGCCGTAACCCAGgGgTTAGGCAAAAATCAGGGgCtGTtTTTTCcgCACgaCCTGCCGGaaTTCAGCcTgACTGAAaTTGATGAGATgCTGAAGCtGGATTTTGTCACcCGCAGTGCGAAGATCCTcTCgGCGTTTATTGGTGATGAAATCCCGCAGGAAaTCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAaGCGATGTCGGTtGTCTGGAaTTGTTCcACGGGCcAACGCTGGCaTTTAAAGATTTCGGcGGTcGCTTTATGGCACAAATGCTgACCcATATTGCGGGCGATAAGCCAGTGAcCATTCTGACCGCGACATCCGGTgATACTGGaGCGGCAGTGGcTCATGcTTTCtACGGTtTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTgTTCTGTACATTGgGCggCAATATCGaAACTGTTGCCATCGAcggCGaTTTCGATGCCTGTCAGGCGCTGGTgAAGCAGGCgTTTGATGATGAAGAACTGAAAGTGgCgCtGGGGCtGAATTCTGCTAAcTCCATCAACaTCAGTCGCTTGCTGGCGcAGATTTGTTaTTAcTTTGaGGCTGTCGCACAGTtGCCGCAAGAAGCACGTAACCAGTTGgTTGTCTCGGTaCCGAGTGgAAACtTcGGCGATtTGACGGcGGGTCTGCTGGCGAaGTcACTCGGTCtGCCGGTAAAACGTtTTATTGCtgCGACCAACGTGAACGAtACCGTACCACGTTTCCTGCaCGaCGGTCAGTGGTCAcCCAAaGCGACTCAGgCGAcgTtaTCCAATGCGATGGATGTTAGCCAGCcAAaCAACTGGCCGCGTGTGGAAGAGTTGtTCcGCCGCAAAATCTGGCAACTGAAAGAGCTGGgTTATGCAGCCGTGgATGATGAAACCACGCAACAGACAATGcGTGAGtTAAaAGAACTGGGCTATACCTCGgAGCCGCACgCTGCCGTAGCTTATCGTGCGCTGCGTGACCAgTTGAAtCCAGGCGAATATGGCTTGTtCCTCGGcACcGCGCATCcGGcGAAatTtAAAgAGAGCGTGGAAGCGATTCTCGGTGAAAcGTTGGatCTGCCAAAAGAGCTGGCAGAACGTGCTgATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAatTgaTGATGAaTCATCAGTAA
|
||||||
|
hypothetical protein
|
||||||
|
AtGCAGCCcGGCTtTTTTTATGAAGAAAATaTGGAGaAaAACGACagGGAAAAAGGAGAAATTCtCAATAAATGCGGtAACTTAGAgATTaGGATTGCGGAGAATaACAACTGCcGTTCTCaTCGCGTAATCTCCGGATATCGACCCaTAACGGgCAATGATAAAAGgAGTAACCTGTGA
|
||||||
|
Non-protein region
|
||||||
|
aAAAACTgCTGGAAACAATGAAAGAcGTACCGGACGACCAAcGTCAGgCGC
|
||||||
|
transaldolase B
|
||||||
|
ATGACGGACAAATTGaCCTCcCTTCGTCAGTACACCACCGTAgTGGCCGACACTGGGGACATCGCGGCAATGAAGcTGTaTCAACcGCAGGATGCCACAACCAAcCCTtCTCTCATTCTTAACGCAGCGCAGATTCcGGAATACCGTAAgTTgATTGaTGATGCTGTCGCCTGGGcGAaACaGCAGAGCAAcGATcGCgCgCAGCAgATCGtGGACGCGACCGAcAAACTGGCAGTAaATATTgGTCTgGAAaTCCTGAAACTGgTTCCGgGCCgTATCTCAActGAAGTtGATGCGCGTCTTTCCTATGACaCCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGcAGGTaTTAGCAACGATCgTaTTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGcAGAACAGCTGGAAAAAGAaGGTATTAACTGTAAcCTGACCCTGCTgtTCTCctTCGCtCAGGcTCGTGCTTGTGCGGaAGCGGgCGTgTTCCTGaTCTCGcCGTTTgTTGGCcGTATTCTTGACTGGTAcAAaGCGAATACCGaTAAGAAAGAGtACGCTCcGGCAGAAGATcCGGGCGTGGTTTCTGTatCtGAAATCtACCAGtACTACaAAGAGCATGGTTaTgAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAAcTGGCAGGCTGCGACCGTCTGACCatCGCACCGgcACTGCTGAAAGAGCTGgCGGAGAGCGAAGGGGCTATCgAACGTAAACTgTCTTACAcTGgTGAAGTgAAAGCgCGTCCGGcGCGTATCACtGAGtCCGAGTTCCTgTGgCAgCACAACCAGGATCCAATGGCAGTaGATAAACTgGcGGaAGgTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCtGTAA
|
||||||
|
molybdopterin biosynthesis mog protein
|
||||||
|
ATGAATACTTTACGTATTGGCTTaGTtTcCaTCTCTGATCGCGCATCCAGCGGCGTTTAtCAGgaTAAAgGCATCCCTGCGCTGGAagAATGGCTGACAtcGGCGCTAACCACGcCGTTTGAaCTGGAAAcCCgCTTaATCCCCGATGAGCAGGCGATCATCGAGCAaACgTTgTGTGAGCTGGTGGATGAAaTGAGtTGCCaTCTGGTGCTCACCACGGGCGGAAcTGGCCCTGCGCGTCGTGAcgTAACGCcCGATGcGACGCTGGCAGTAGCGGACCGCGAGATgCcAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACcaaCTGCGATCCTTTCGCGTCAGGTggGGGTgATTCGCAAACAGGCGCTGATCCTTAACTTaCcCGGTCAACCGAAGtCTATTAAAGAGACGCtGgAAGGTGtGAAGGACGCTGAGgGTAAcGTTGTGGTGCACGgTATTTTTGCCaGCGTaCcGTaCTGCATTCAGTTGCTGGAAGGGCCATACGTTGAaACGGCaCCgGaAGTGGTTGCAGCATTCAGaCCGAAGAGTGCAaGACGCGAAGtTAGCGAATAA
|
||||||
|
chaperone protein DnaK
|
||||||
|
aTGGGTAAAATAaTTGGTATCGACcTGGGTACtACCAaCTCTTGTGTagCGaTTAtGGATGGCACCACTCCtCGTGtACTGgAGAACGcCGAAGGCGATCGCACCAcGcCTTcTATCATTgCCTATACCCAGGAtGGTGAAACTCTGGTTgGTCAGCCGGCTAAACGTCAGGCAgtGACGAACCCgCAaAACAcCCTGTtTGCGATTAAACGCCtGATTGGCCGCCgCTTCCAGgACgAAGAAGTACAGCGtGATgTTTcCATCATGCCGTTCAAAATTAtTGcTGCtgatAACGGCGACGcATGGGTCGAAGtTAAAgGCCAGAAAATGGCAcCGCCGcAGAtCTCTGCTGAAGTGCTGAAAAAAAtGAAGAAAACCGCTGAAGaTTAcCTGGgTGAAcCGGTAACTGaAGCTgtTATTACCGTACCGGCAtACTttaACGATGCTCAGCGTCAGGcAACCAAAGaCGCAGGCCGTATCGCTGGTCTGGAAGTAAAaCGTATCATCAACGAaCCGACCGCAGCTGCGCTGGCTtACGGtCTGGACAAAGgTACTGGCAACCgtACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTcCATTATCGAaATCGACGAAGTTGACGGCgAAAAAACCttCGAAGTTCTGGCAACCAACGGTGATACCCACCTGgGTGGtgAAGACTTCGACAGTCGTCTGATCAACTAtCTGGTTGAaGAATTCAAgAAAGATCAGGGCATTGacCtGCGCAACGaTcCGCTGGCAATGCAGCGCCTGAAaGAAGCGGCAGAAAAAGCgAAAATCGAACTGTctTCCGCTCAGcAGACCGaCGTTAACcTGCCGTACATCACTGCAGACGCGAcCGGTCCGAAACACAtGAACATCaAAgTGactCGTGCGAAACTGGAAAGCCTgGtTGAAGAtCTGGTAAACCGtTcCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATAtCGACgaCGTTATTCTCGTTGGTGGTCAGACTCGTATGCcAATGGtTCAGAAGAAAGTTGCTGaATTCTTTGGTAAAgAGCcGCGTAAAGATGTTAACCCGGACGAAGCTGTaGCCATCGgTGCTGCTGTTCAGGGTGGTGTTCTGACTGGtGAcGTAAAAGaCGTacTGCTgCtGGACGTTACCCCGCTGTCtCTGGGTATcGaAACCaTGGGCGGTGTGATGACCACGCTGATCGCgAaAAACACCACTATCCCGACCAaGcAcaGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATcCATgtGCTGcAGGGTGAACgTAaACGTGCgGCTGAtAAcaAATCTCTgggTCAGTTcAACCTGGATGGTATCAaCCCGGCACCGcGCGGCAtgCCGcAGATCGAAGtTACCtTCGAtATCGaTGCTGACGGTATCCTGCaCGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCAcTATCAaGGCTTCTTCTGGtCTGAaCGAAGAtGAAATCCAGAAAATGGTACGCGaCGCAGAAGCTAAcGCCGAAGCTGACCGTAaGTTTGAAGAGCTGGTACAGACtcGCaACCAGGGCGACCATCTGCTGCACAgCACCCGTAAGCAgGTTGAAGAAGCAGGCGACAaACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGActGCACTgGAAACtGCTCTGAAaGGTGAAGaCAAAGcCgCTATcGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCaGCAGCAACATGCcCAGCAGCAGACTGCCGGTGCTgATgCTTCtGCAAaCAAcGCGAAAGaTGACGATGTTGTCGACGCtGAATTTGAAGAAGTCAAAGACAAAAAATAA
|
||||||
|
chaperone protein DnaJ
|
||||||
|
GTGCatTCatCTAGGGGcAATTTAAAAAAGATGGCTAAGCAAGATTaTTACGAGaTTTTAGGCGTTTCCAAAaCAGCGGAAGAGCGtGAaaTCAAAAaGGCCTACAAACGCCTGGCCATGAAaTACCaCCCGGaCcGTAACCAGGgTGACAAAGaGGCCGAGGCGAAATTTAAAGAGATCAAGGaAGCTTATGAAGTTCTGACCGACtCGCAAAAACgTGCgGCATaCGATCAGTaTGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGcGGtTTTGGCGGCGGCgCAGACTTcAGCGATAtTTtTGGTGACGtTTTCGGCgATATTTTTGGcGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTAcGCTATAACATGGAGctCACcCtCGAAgAAGCTGTACGtgGCGtGaCCAAAGaGATccGCATtCCGACTCtGGAAGAGTGTGACGTTTGCCACgGTAGCgGTGCAAAACCaGGTACACAgCCgCAGACCTGTCCGACcTgTcATGGTTCTGGCCAGGtGCAGATGcGCCAGGGTTTCTTTGcCGTGCAGCAGACCTgTCcAcACTGTCAGGGCCGCGGTACGCTGaTcAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGtTGAGCgCaGCAAAACGCTGTCCGTTAAAATCCCGGCaGGGgTGGACACTGGAGaCCGCATCCGTCTTGCGgGCGAAGGTGAAGCGGGTGAACACGgCGCACCGGCAGGCGATCTgTACGTTCAGGTtCAGGTtAAACaGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGcGAAGTcCCGATCAAcTTCGCTATGgCGGCGcTGGGTGGTgaAATCGAAGTACcGACCcTTGATGGTcGcGTCaaACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAgCTGtTCCgTaTGCGCGGTAAAGGCGTCAAGTCtGTcCGCGGTGGcgCACAGGGTGATTtGCTATGCCGCGTTGTTGTCgaAACAcCGGTAGGTTTGAACgAGAAGCAGAAACAGCTGCTGCAAGaGctGCAAGAAAGCtTTGGTGGcCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCtTCTTtGATGGCGTGAaGAAGTTTTTTGACGaCCTgACTCGCTAA
|
||||||
|
hypothetical protein
|
||||||
|
TTGCTCTTaCTCGGATTCgTAAGCCGTGAAAACAGCAaCCTCCGtCTGGCCAGTTCGGATGTGAACCTCACAGAGgTCTTTTCTCGTTACCAgCGCCGCCACTACGGCGGTgATACAGATGACGATCAGgGcgACaAtcAtCgCcTTATGCTGCTTCATTGCTCtCTtCTCCTTGACCTTTCGGTCaGTAAGAgGCACTCTACATGTGTTCTGCATATAGgGGGCCTCGgGTtGATGgTAAAATAtCACTCGGGGCTTTTCTCTAtCTGCCGTTCAGCTAATgCcTGA
|
||||||
|
hypothetical protein
|
||||||
|
aTGTCTGCCAAaaGACGACTTCTTATTGCGtGTACCTTGAtAaCAGCTATcTATCAtTTTCCTGcaTATTCTTCATTAgAATATAAAGGAtCCTTTGGTTCAATaAATGCGGGTTAtGCAGACTGGAATAGTGGaTTTgTAAaCACTCACCGTGGTGAaGTATGGAAAGTGACtGCGGATTTTGGGgTaAATTTTAAAGAAGCAGAATTTTACTCAtTTTATgAaAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACgGtTTCAGCAATGaCGCATGTCAGACTCtTTGaCtCTGATaTGACATTCTTTGGCAAAATTTaTGgCCAATGGGATAACTCATgGggTGAcGATCTgGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCgAgTGGgGCTTTTtTAAACCGTATATTGGATtGCATAATCAATCTGGTGACTACGTATCAGCTAAATaTgGTCAAACGAATgGTTgGAATGGtTATGTTGTTGGCTGGACAGCAgTATTAcCATTTAcGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGaAATAGAACTGGACAGGaACGATGCTTACACGgAgCAGcAATTTGGCcGGAACGGgTTaAaTGGCGGtTTAACTATTGcCTGGAAGTTCTATCCTCGCTGGAAAGCCAGtGTGACGTGGCGTTATTTcGATAAtAaGCTGGGCTACGATGGCTTTgGcgaTCAAATGATTTAtATGCTTGgTTATGATTTCtAA
|
||||||
|
putative secreted sulfatase
|
||||||
|
ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAAtGCTTTTAGtCCTGCCTTAGCCGCAGAGGCTaAACAACcTAATTTAGTCATtaTTATGGCGGaTGATtTAGGTtaTGGCGAtTTAGcAaCaTATGGTCATCAGATCGTTAAAACACctAATATCGACAGGCtTGCCCAgGAAGGGGTCaAATTtACTGAcTaCTATGCCCCCGCTCCTTtAaGTTCAccTtCACGCGCaGGGCTATTAACCGGCcGGATGCCATTtCGTAcTGGAATTCGCTCATGGATtCCttCAGGCAAAGATGTTGCCtTAGGGCGTAACGAAcTCACgATTGCTAaTCTACTCAaAgCGCAaGGGTACGACACggCAATGATGGGTAAGCTGCATCTGAATgCAGGcGGCGaTCGCACCGATCAgCCaCAAGCACaAgATATGGGcTTTGATTAcTCAcTGGTtAATACgGCGGGCTTTGTTACcGACGCCACGCTGGATAAcGCTAAAGAACGCCcGCGTTATGGCATGGTTtAccCGACAGGCtgGCtACGTAACGGGCAACCCACTcCACGaGCTGATAAAAtGAGCGGTGAGTATGTCaGTTCGGAAGTCGTCAACTGGCTGGATAACAAAaaGGACaGCAAGCCTTTCTTCCTCTATgTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAaaATACCTCGATaTGTaCTCACaATATATGAGCGCGTATCAGAAGCAGcATCCTGATTTAtTTTaTGGCGACTGGGcAgACAAACCCTgGCGTgGTGTGGGgGAATATTAtGCCAATATCAGCTATCtGGATGCAcAGGTTGGAAAAgTGCTGGaTAAAATCAAAGCTGTGGgtGaAGaaGaTAACACAATCGTTATTTTTACCAGTGatAACGGTCCgGTAaCGCGTGAAGCGCGCAAAGTGTATgAGCTGAATTTGGCAGGGGAaACGGaTGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGtGTTCCaGCCATTATTAAATaTGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGtCTgGACTGGATGCCTACtTTaGCgAaAATGATGAACTTCAAATTACCTACAGAcCGTAcTTTCGATGgTGAATCGCTGGTTCCTGtTcTTGAGCaAAAAGCATTGAAACGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATgATCCAAcCGATGAATGGGCGATCCGTGATGgTGACTGGAAgAtGATTATCGATCGcaATAATAAACcGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAaCaCTTaAtCTGATCGGTAAAAAAACAgATATTGAAAAACAGATGTATGGTaAGtTTtTAAAATATAAAACTGATATTGATaATGATtCTCTAATGAAAgCCAGAGGTGATAAACCAGAAGCGGTGACCTggGGCTAa
|
||||||
|
putative cytoplasmic protein
|
||||||
|
ATGTTTACcAacGTAAATGTTGATTGtTgCAAAACACCAGGAtGTAAaaACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCAcAGgGTaAaAATATTTtATGCCGTGAATGTgGTTaCTTGTtTCCAGtGATATCTGAACAGTCGCTTAAtATTTaTCGTAATATTGTGAAtcACTcCTGGAGAGGTTTGATTTGCCAATGTTCAACTtGCGGAGGcACGTCCCTCAAAAAATaTGgATATtCtGCAcAagGCCAgAGAAGAATgTATTGCcaTCAtTGTGaGAAAACaTTtATCACTCTGGAAcAtGTAATTACcACACCACGAGGAGCcCTGTTAGcATTGATGATTGAGCAAGGGGAGGCACTTGCGGaTATCAgAAAGTCATTACGTCTTAACAgCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGcAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGtACCCGCGCTTtTCGcgTCAAGTAtAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGcGGCAGGGTgGTTGcCaTCTCAACCAATTACTCCCCATCtGCCGTAGagCaaCATTATcAATACaCATCGAACtATGAAGAGcGTATGTCTCCAGGGACGCTGGCACAtCATGTCCAGCGCAAAGAGttACTTACTATGCGGCgGGATACCTTGTTTGATATTGATTACGGCcCGgCAGTTTTACATCAAAACGATCCGGGAATGtTGGTAaAaCCGGTTCTTCCGGCATaTCGTCATTTTgAACTGGTCAGAATACTGACCGATGAGCATtCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATaTTGGGCGGCTGcCTGATGGCTAATTTGCAGCaTATTCATCAaGGTCGCTGCCATATTTCcTTTGTCAAaGAGCGcGGTGTGGCACCCGCCACCATTGaTTTTCCACCGCGATtATTCcTTAGTgGtGGgGTACgAAATAATGTCTGGCGTGCaTTTTCTAACCGCAATTATTCAaTGGCTGTATGCAAtCTCaCTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATtGAACAGTGCGACGCgTTtTATCCACTTTGTGgaGAACCATCCTTTCCTTATaTCATTGAACCGAATgtCTCCTGCGaaTGTCgtTTCTACaTTAGATaTCCTCAAACaTCTGTGGAATAaAaAACTAGagCATGGAACAATTtAA
|
||||||
|
sodium/proton antiporter 1
|
||||||
|
GTGAAACATCTGcATCGATTCTTTAGCaGTGATGCCTCGGGAGgCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTgcAaCCAGTGGATGGTATCACGACTTTCTTGAGACGCcGGTTCAGcTcCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGaCGCTCTGaTgGCGGTATTTTTCCTGTtGGTTGGTcTGGaAGTTAAAcGCGAGcTGaTGCAaGGTTCGCTGGCCAGTCtGCgCCAGGCGGCatTTCCTGTTATTGCCGcAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTtTtAACTATGCCGATCCGaTTaCCCGCGAAGGcTGGGCAatCCCGGCGGCGACTGacATTGCCTTTGCACTTggTgTGTTGGCGCTgTTGGGAAGTCGTGTTCCGTTAGCGCtGAAGATCTTTTtGATGGCTCTGGCtATTATCGACGATCTTgGGGcCATCATtATCATCGCATTGTTCTACAcTAATGACTTATCGATGGCCTcTCTTGGCGTcGCgGCTGTAGCAATTGCGgtACTCGCGGTATTGAAtCTGTgTGGTGTAcGCCGCACGGGCGTtTATATTCTGGTTGGCGTGGTGCtGTGGaCAGCGGTGTTGAAATCGGGGGTTCACGCAACCcTGGCTGGCGtCATtGtCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGgCGCTCTCcGgCTAAACGTCTGGAGCATGTTTTGCAtCCATGGGTGGCGTATCTGATtTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAaGGTgTCACGCtggAaGGTTTgACCtCCATTCTGCCATTAGgGATCATCGCTGGTTTGCTGaTTGGCaAGCCACtGGGTAtTaGTCTgttcTGCTGGtTGGcgCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACgACTtACCAGCAAATTATGGCGGtTGGTaTCcTGTGCGgTATCgGTTtTAcTatGTCTATCTTTATTGCCAGCCTGGcATTTGGTAgCGTAGATcCAGAaCTGaTTAACtGGGCAAAAtTAgGTATCCTTGTCGGTTCAATTTCtTcGgCGGTAATTGGATATAGcTGGTTACGcGTTCGTTTACGTCcATcAGTTTGA
|
||||||
|
transcriptional activator protein NhaR
|
||||||
|
ATGAGCATGTCTCATaTCAATTACAACCACTtGTATTACTTCTGGCaTGTCTAcAAAgAaGGTTCTGtGGTTGGCgCAGCGGAGGCGCTTTATTTAACAcCAcAAACCATTACCGGGCaGATCCGGGCGCTGGAaGAGCGCCTGCAAGGGAAAcTATTTAAGCGTAAAGGAcgTGGTCTGGAACCCAgcGAACTGGGGGAACTGGTCTATCGCtATGCCGATAAAATGTTCAcCTTAAgCCAGGAAATGCTgGATATCGTCAACTATCGCAAAGAGTCCAACTtATTGtTTGATGTTgGTGTGGCAGATGCACTTtcCAAAcGtcTGGTCAGCAGTGTTCtgGATgCCGCAGTtgTGGAAGACGAGCAGAtCCATCTACGCTGTTTCGAaTCGACGCACGAGATgCTTTTaGAGCAgtTGAGTCAGCATAaACTGGATATGATcaTCTCTGACTGTCCGaTCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAaTtGGCGAATGTGGTGTCAgtTTCTGGTgCACTAACCCACTACcAGAAAAGCCGTTTCCTGCCtGTCTTGAAgAGCgTCGtTtACTTATTCCGGGGCGTCGCTCAaTgTTGGGGCGtAAACTATTAAACTGGTTTAACTCcCAGGGCTTGAACGTCGAAATTTTGgGTGAGTTTGATGATGCTGCGTTGATGAAAgCCTTTGGGGCGAcGCATAACGcTATTTTCGTTGCACCTTCGCtTTACGCTAATgATTTCTATAACgATGACTCGgTtGTGgAGATAGgCCGTGTTGAGaACGTGATGGAAGAGTACCACGCGATTTtTGCCGaAAGgaTGAtTCAgCACCCTGcAGTAcAGCGTATCTGcAATACAgacTATTCTGCGCtgTTTACTCCAGCTTcAAAATAA
|
||||||
|
riboflavin kinase
|
||||||
|
ATGAAGCTGATACGCGgCAtACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTaATTTCGACGGCGTGCATCGCggTCATCGCGCGCTGTTACAGGGCtTGCAGGAAGAAGGGCGCAAGCGCAACtTACCGGTGATGGTGATGCTTTTtGaACCTCAACCAcTGGAACTGTTTGCTACTGAtAAAGCcCCGGCACGGcTcACcCGGCTGCgGGAAAAACTGCgTtaTcTTgCAGAgTGTGGCGTTGATTACGTGCTGTGCGtGCGTtTTGaCaGGCGTtTTGCGGCGTTAACCGCGcAAAACTTCATCAgTGATCTtCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGAtTTCCGCTTTggCGCTGgTCGTGAAgGCGAtTTCTtGTTATTACAGAaAGcgGGCATGGAATACGGCTTCGATATcACCAGCaCGCAAAcTTtTTGCGAAGGTGGTGTGCGtATCAGcAGCACCGCCGtgCGTCAGGCGCtTGCGgATgACAATCTGGCTCTGGCAGAAAGTTTACTGGgGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGaATTAGGGCGCAcTATAGGTTTCCCgACGGCGaATGTACCGcTaCgCCGTCAGGTTTCCCCGGTGAAAgGGGTTTATGCGGTAGaAgTgTTGGgCCtTGgCGAAaAGcCGTTAcCCGGcgTTGCAAACaTCGGAACACgCCCAACGGTTGCcGGTATTCGCCAGCAACTGgaAGTGCATTTGTTAGATGTTGcAATGGaCCTTTATGGTCGCCAtATACAAGTAGTGCTGCGtAAAAaAATAcGCAATGAGCAgCGATTTGcATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGcCCGCGaaTTTtTTGGGCTAAcAAAACCGGCTTAa
|
||||||
|
Isoleucyl-tRNA synthetase
|
||||||
|
ATGAGTGACTATAAATCaACCCTgAATTTGCCgGAAACAGgGTtCCCGATgCGTGGCGATCTCGcCAAGCGCGAAcCGGGaATGCTGGCGCGTTGGACTGATGATGATCTgTaCGGCATCATCCGTGCGGCTaAAAAAGGCAaAaAAACCTTCAtTCTGCATgATGGCCcTCCTTATGCGAATGGCAGCAtTCaTATTGGTcACTCGGTTAACAAGATTCTGAAAGACATTaTCATTaAgTCCAAAgGGCTttCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCaTGGtCTGCCAATCGAAcTGAAAGTAGAGCAAGAATACGGTAAGCCGGGgGAGaAaTTCACCGCCGcTGAGTtCCGCGCCAAGTGCCGCGAATACGCTGCgACCCAGGTTGACGGTCAGCGCAAAGACTTTaTCcGTCTGGGCGTGCTGGGCGActgGTCgcACCCGTACCTGACCATGGACtTCAAAACTGAAGCCAACATCATCCgCGCGCTGGGCAAAATCATCGGCAAcGGTCACCTGCACaAAGGcGCGAAGCCGGTgCACTGGTGCgTTGACTGCCGTTCTgCACTGGCAGAAGCGGAAGtTgAGTATTACGacAAAACTtCTCCGTCCATCGACGTCGCTTtCCAGGCGGTCGATCaGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATgTTAACGGCCCAATTTCGCtGGTTATCTGGaCcACCACGcCGTGgAcGCTGCcTGCTAacCGCgCAATCTCcATtGCACCTGATTTTGAttATGCGCTGGTGCaAatCgACGGTCAGgCCGTGATCCTCGCGAAAGATCtGGtTGaAAGCGTAAtGCAGCGTATCGGCGTTAGCGaTTACACCATTCTTGGCAcGGtgAAAGGTGCCGAGCtGGAACTGTTgCGCTTTACCCATCCGTTtATGGACtTCGATGTTCCGGCAaTTCTCGGCGACcACGTTACgCTGGATGCCGGTACCGGTGcCGTTCATACCGCGCCAGGCcACGGTCCGGaCGACTATgTGATCGGTcAAAAATaTGgTCTGGAAaCCGCTAACCCgGTTgGCcCGGACGgCACtTaTCTGCcGgGTACTTACCCGACTCtGGATgGCGTTaACGTCTTCAAAGCGAACGaTATTGTCATTGCGTTGTTgCAGGAAAAAGGcgCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTgCTGCtGGCGTCaTAAaACGCCGATCAtCTTCCGcgCGACGCCGCAGTGGTTCGTCAgCAtgGATCAGAAAGGTCTGCgTGCGcAGTCACTGAAAGAGATCAAAGGCgTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATcTCTCGTCaGCGTACCTGGGGcGTGCCgATGTCACTGTTCGTgCaCAaaGACACAGAAGAaCTGcATCCGCgTACTCtcGAACTGaTGGAAGAAGTGGcAAAACGCGTTgAAGTtGACgGCATTCAGGCgTGGTGGGATCTCGATGCGAAaGAgATCcTCGGCGaCGAAGCTGACCAGTATGTGAAAGTACCGGATACGCtGgATGTATGGTtTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTcCGGAATtTGCCGGTCACGCAGCGGACATGTaTcTGgAaGGTTCTGACCAACACcGTGgCTGGTtCATGTCtTCCCTGATGATCTCTACCGCGATGAAGGGcAAAGcGCCATATCGTCAGGTACTGACTCACGGCTTTAcCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGtAACaCcGTTTCGCCGCAGGATGTgATGAATAAACtGGGtGCGGATATTCTGCGTCTGTGGGTGGcATCAACCGACTAcACTGGCGAAATGGCcGtTTCTGACGAGATCcTGAAACGtGCTGCcGACAGCTATCGTCGTATCcGTAACAcCgCGCGCTTCCTGCTGGCAAACCTGAA
CgGTTtTGAtCCGGCaAAAGaTATGGTGAAACCGGAAGAGATGGTGGTaCTGGATCGCTGGGCCGtAGGTTGTGCGAAAGCGGCACAGGAAGACATCCtCAAGGCgTACGAAGCATACGATTTCcACGAAGTGGTaCAGCGTcTGaTGCGCtTCTGCTCCGTTGAGATGgGTTccTTCTACCTCGACATCATCAAAGACCGTCAgTATACcGCCAAAGCGGaCAGCGTGGCGCGTCGTAGCTGCCAGAcTgCGCTGTATCACATCGCaGAAGCGCTGGTTCGCTGGATGGCAcCAATCCTCTCCTTCaCcGCTGaTGAAGTGTGGGGtTaCCTGCCggGCGAACGTGAAAAATACGTCTTCAcCGGCgAgTGgTACGAAGGCCTGtTTGGTCTGGCAGACAGTGAAGCAATGAACGaTGCGTTCTGGGACGAGCTGTTGAAAGTGcGTGGCGAAGTGAAcAAAGTcaTTGAGCAAGCgCGTGCCGATAAGAACGTGGGcGGCTCGCTGGAAGCGGCAGTAAcCTTGTATGCAGAACCGGAaCTGGCgGCGAaaCTGaCCGcGCTGGGCGAtGAATTACGATTTGTCCTGtTGACCTCCGgCGCTAcCGTTGcAGACtATAACGACGCACCTGCTGATGCCCAGCAGaGCGAaGTcCTCAAAGGGCTGAAAgtCGCGTTGAGTAAAGCCgAAGGtGaGAAGTGTCCtcGctGCTGgCACTACACCcAGgATGTcGgCAAGGTGGCGGaACACGCAGAAATCTGCGGCCGCTGTgTcAgCaACGTCGCCGGTGACGGTGAAAAaCGTAAGTTTGCCTGA
|
||||||
|
Non-protein region
|
||||||
|
GCTTGCGCCAACGcCATTTCATCGCCATCCCGCCgAgcATACAGGCCTCGgAaGAACCAaTGGTGTTGGTGcCAACGGCCtGAccATTTTTcGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGcAGaTTGCGGATATTctTCTTTGTCGATCCAGTTTTTGTtAATGGAtAAAtCCA
|
||||||
|
FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase
|
||||||
|
ATGTCTGAATCTGTACAGaGCAaTAgCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGAtGGCaCCAcCGCTGAGTCTACCCGCAaCAaCGGTAaACCGGCGCTGTTCCGCcTGgGTgATGCTTCTCTTTCTgAaGgGCTGGAGCAACACCTGCTgGGGCTGAAAGTGGgCGATAAAACCaCCTTCtCGCTGGAGCCAGATGCGGCgTTtgGCGTGCCGTcACCgGAcCTGATtCAGTAcTTCTCcCGCCGTGAATTTATGgATGCAGGCGAGCcaGAAATTGGCGCAATCATgCTTTTTACCGCAATGGaTGGCAGTGAGATGCCTGGCGTGaTCCGCgAAATTAACGGCGACTCCATTACCGTTGATTTCAACCaTCCGCTgGCCGGGCAGACCGTTCATTTTGATATTGaagTGCTGGaAATCGATCCGGCAcTGGAGGcGTaA
|
|
@ -0,0 +1,63 @@
|
||||||
|
Region Name: cure for cancer protein
|
||||||
|
Nucleotides: ATGCCACTATGGTAG
|
||||||
|
Nuc. Counts: [4, 3, 4, 4]
|
||||||
|
Total Mass%: [27.32, 16.84, 30.55, 25.29] of 1978.76
|
||||||
|
Codons List: [ATG, CCA, CTA, TGG, TAG]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: captain picard hair growth protein
|
||||||
|
Nucleotides: ATGCCAACATGGATGCCCGATATGGATTGA
|
||||||
|
Nuc. Counts: [9, 6, 8, 7]
|
||||||
|
Total Mass%: [30.65, 16.8, 30.47, 22.07] of 3967.54
|
||||||
|
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, GAT, ATG, GAT, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: bogus protein
|
||||||
|
Nucleotides: CCATTAATGATCACAGTT
|
||||||
|
Nuc. Counts: [6, 4, 2, 6]
|
||||||
|
Total Mass%: [35.13, 19.25, 13.1, 32.52] of 2308.08
|
||||||
|
Codons List: [CCA, TTA, ATG, ATC, ACA, GTT]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: michael jordan mad hops protein
|
||||||
|
Nucleotides: ATGAGATCCGTGATGTGGGATCCTACTCATTAA
|
||||||
|
Nuc. Counts: [9, 6, 8, 10]
|
||||||
|
Total Mass%: [28.0, 15.35, 27.84, 28.81] of 4342.86
|
||||||
|
Codons List: [ATG, AGA, TCC, GTG, ATG, TGG, GAT, CCT, ACT, CAT, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: paris hilton phony protein
|
||||||
|
Nucleotides: ATGCCAACATGGATGCCCTAAGATATGGATTAGTGA
|
||||||
|
Nuc. Counts: [12, 6, 9, 9]
|
||||||
|
Total Mass%: [33.96, 13.96, 28.49, 23.58] of 4774.27
|
||||||
|
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, TAA, GAT, ATG, GAT, TAG, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: george w bush approval rating protein
|
||||||
|
Nucleotides: ATGATAATTAGTTTTAATATCAGACTGTAA
|
||||||
|
Nuc. Counts: [12, 2, 4, 12]
|
||||||
|
Total Mass%: [41.06, 5.63, 15.31, 38.01] of 3949.54
|
||||||
|
Codons List: [ATG, ATA, ATT, AGT, TTT, AAT, ATC, AGA, CTG, TAA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: jimi hendrix guitar talent protein
|
||||||
|
Nucleotides: ATGCAATTGCTCGATTAG
|
||||||
|
Nuc. Counts: [5, 3, 4, 6]
|
||||||
|
Total Mass%: [28.58, 14.1, 25.57, 31.75] of 2364.1
|
||||||
|
Codons List: [ATG, CAA, TTG, CTC, GAT, TAG]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: tyler durden's brain protein
|
||||||
|
Nucleotides: ATGATACCTATGAGTAATGTGGACCATATCCAAACTATAGGCATTGTCGGACCAACGATCGATTGGTTATACTGA
|
||||||
|
Nuc. Counts: [24, 14, 16, 21]
|
||||||
|
Total Mass%: [32.95, 15.8, 24.56, 26.69] of 9843.81
|
||||||
|
Codons List: [ATG, ATA, CCT, ATG, AGT, AAT, GTG, GAC, CAT, ATC, CAA, ACT, ATA, GGC, ATT, GTC, GGA, CCA, ACG, ATC, GAT, TGG, TTA, TAC, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: mini me growth hormone
|
||||||
|
Nucleotides: ATGGGACGCTGA
|
||||||
|
Nuc. Counts: [3, 2, 5, 2]
|
||||||
|
Total Mass%: [24.82, 13.6, 46.26, 15.32] of 1633.44
|
||||||
|
Codons List: [ATG, GGA, CGC, TGA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
|
@ -0,0 +1,63 @@
|
||||||
|
Region Name: cure for cancer protein
|
||||||
|
Nucleotides: ATGCCACTATGGTAG
|
||||||
|
Nuc. Counts: [4, 3, 4, 4]
|
||||||
|
Total Mass%: [27.51, 16.96, 30.77, 25.47] of 1964.7
|
||||||
|
Codons List: [ATG, CCA, CTA, TGG, TAG]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: captain picard hair growth protein
|
||||||
|
Nucleotides: ATGCCAACATGGATGCCCGATATGGATTGA
|
||||||
|
Nuc. Counts: [9, 6, 8, 7]
|
||||||
|
Total Mass%: [30.76, 16.86, 30.58, 22.15] of 3953.5
|
||||||
|
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, GAT, ATG, GAT, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: bogus protein
|
||||||
|
Nucleotides: CCATTAATGATCACAGTT
|
||||||
|
Nuc. Counts: [6, 4, 2, 6]
|
||||||
|
Total Mass%: [35.56, 19.49, 13.26, 32.92] of 2280.1
|
||||||
|
Codons List: [CCA, TTA, ATG, ATC, ACA, GTT]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: michael jordan mad hops protein
|
||||||
|
Nucleotides: ATGAGATCCGTGATGTGGGATCCTACTCATTAA
|
||||||
|
Nuc. Counts: [9, 6, 8, 10]
|
||||||
|
Total Mass%: [28.37, 15.55, 28.2, 29.18] of 4286.8
|
||||||
|
Codons List: [ATG, AGA, TCC, GTG, ATG, TGG, GAT, CCT, ACT, CAT, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: paris hilton phony protein
|
||||||
|
Nucleotides: ATGCCAACATGGATGCCCTAAGATATGGATTAGTGA
|
||||||
|
Nuc. Counts: [12, 6, 9, 9]
|
||||||
|
Total Mass%: [34.27, 14.09, 28.74, 23.79] of 4732.2
|
||||||
|
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, TAA, GAT, ATG, GAT, TAG, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: george w bush approval rating protein
|
||||||
|
Nucleotides: ATGATAATTAGTTTTAATATCAGACTGTAA
|
||||||
|
Nuc. Counts: [12, 2, 4, 12]
|
||||||
|
Total Mass%: [42.57, 5.83, 15.87, 39.41] of 3809.4
|
||||||
|
Codons List: [ATG, ATA, ATT, AGT, TTT, AAT, ATC, AGA, CTG, TAA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: jimi hendrix guitar talent protein
|
||||||
|
Nucleotides: ATGCAATTGCTCGATTAG
|
||||||
|
Nuc. Counts: [5, 3, 4, 6]
|
||||||
|
Total Mass%: [29.1, 14.35, 26.03, 32.33] of 2322.0
|
||||||
|
Codons List: [ATG, CAA, TTG, CTC, GAT, TAG]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: tyler durden's brain protein
|
||||||
|
Nucleotides: ATGATACCTATGAGTAATGTGGACCATATCCAAACTATAGGCATTGTCGGACCAACGATCGATTGGTTATACTGA
|
||||||
|
Nuc. Counts: [24, 14, 16, 21]
|
||||||
|
Total Mass%: [33.28, 15.96, 24.81, 26.96] of 9745.8
|
||||||
|
Codons List: [ATG, ATA, CCT, ATG, AGT, AAT, GTG, GAC, CAT, ATC, CAA, ACT, ATA, GGC, ATT, GTC, GGA, CCA, ACG, ATC, GAT, TGG, TTA, TAC, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: mini me growth hormone
|
||||||
|
Nucleotides: ATGGGACGCTGA
|
||||||
|
Nuc. Counts: [3, 2, 5, 2]
|
||||||
|
Total Mass%: [24.82, 13.6, 46.26, 15.32] of 1633.4
|
||||||
|
Codons List: [ATG, GGA, CGC, TGA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
|
@ -0,0 +1,140 @@
|
||||||
|
Region Name: thr operon leader peptide
|
||||||
|
Nucleotides: ATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGA
|
||||||
|
Nuc. Counts: [21, 22, 12, 11]
|
||||||
|
Total Mass%: [32.9, 28.34, 21.02, 15.95] of 8625.7
|
||||||
|
Codons List: [ATG, AAA, CGC, ATT, AGC, ACC, ACC, ATT, ACC, ACC, ACC, ATC, ACC, ATT, ACC, ACA, GGT, AAC, GGT, GCG, GGC, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: aspartokinase I/homoserine dehydrogenase I
|
||||||
|
Nucleotides: ATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGGGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCATCTGGTAGCGATGATTGAAAAAACCATTAGCGGTCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTCTGACGGGACTCGCCGCCGCCCAGCCGGGATTTCCGCTGGCACAATTGAAAACTTTCGTCGACCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATCAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCATTATGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGGTCGAAAAACTGCTGGCAGTGGGTCATTACCTCGAATCTACCGTTGATATTGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCGGCTGACCACATGGTGCTGATGGCTGGTTTCACTGCCGGTAATGAAAAAGGCGAGCTGGTGGTTCTGGGACGCAACGGTTCCGACTACTCCGCTGCGGTGCTGGCGGCCTGTTTACGCGCCGATTGTTGCGAGATCTGGACGGATGTTGACGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGGAAGCGATGGAGCTTTCTTACTTCGGCGCTAAAGTTCTTCACCCCCGCACCATTACCCCCATCGCCCAGTTCCAGATCCCTTGCCTGATTAAAAATACCGGAAATCCCCAAGCACCAGGTACGCTCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATCTGAATAACATGGCAATGTTCAGCGTTTCCGGCCCGGGGATGAAAGGGATGGTTGGCATGGCGGCGCGCGTCTTTGCAGCGATGTCACGCGCCCGTATTTCCGTGGTGCTGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCAAAGCGACTGTGTGCGAGCTGAACGGGCAATGCAGGAAGAGTTCTACCTGGAACTGAAAGAAGGCTTACTGGAGCCGTTGGCGGTGACGGAACGGCTGGCCATTATCTCGGTGGTAGGTGATGGTATGCGCACCTTACGTGGGATCTCGGCGAAATTCTTTGCCGCGCTGGCCCGCGCCAATATCAACATTGTCGCCATTGCTCAGGGATCTTCTGAACGCTCAATCTCTGTCGTGGTCAATAACGATGATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGGCGTCGGTGGCGTTGGCGGTGCGCTGCTGGAGCAACTGAAGCGTCAGCAAAGCTGGTTGAAGAATAAACATATCGACTTACGTGTCTGCGGTGTTGCTAACTCGAAGGCACTGCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGGAAGAACTGGCGCAAGCCAAAGAGCCGTTTAATCTCGGGCGCTTAATTCGCCTCGTGAAAGAATATCATCTGCTGAACCCGGTCATTGTTGACTGTACTTCCAGCCAGGCTGTGGCAGATCAATATGCCGACTTCCTGCGCGAAGGTTTCCACGTTGTTACGCCGAACAAAAAGGCCAACACCTCGTCGATGGATTACTACCATCAGTTGCGTTATGCGGCGGAAAAATCGCGGCGTAAATTCCTCTATGACACCAACGTTGGGGCTGGATTACCGGTTATTGAGAACCTGCAAAATCTGCTCAATGCTGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTATATCTTCGGCAAGTTAGACGAAGGCATGAGTTTCTCCGAGGCGACCACACTGGCGCGGGAAA
TGGGTTATACCGAACCGGACCCGCGAGATGATCTTTCTGGTATGGATGTGGCGCGTAAGCTATTGATTCTCGCTCGTGAAACGGGACGTGAACTGGAGCTGGCGGATATTGAAATTGAACCTGTGCTGCCCGCAGAGTTTAACGCCGAGGGTGATGTCGCCGCTTTTATGGCGAATCTGTCACAGCTCGACGATCTCTTTGCCGCGCGTGTGGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATATTGATGAAGATGGCGTCTGCCGCGTGAAGATTGCCGAAGTGGATGGTAATGATCCGCTGTTCAAAGTGAAAAATGGCGAAAACGCCCTGGCCTTCTATAGCCACTATTATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCAATGACGTTACAGCTGCCGGTGTCTTTGCTGATCTGCTACGTACCCTCTCATGGAAGTTAGGAGTCTGA
|
||||||
|
Nuc. Counts: [551, 608, 692, 612]
|
||||||
|
Total Mass%: [23.04, 20.91, 32.37, 23.7] of 323096.2
|
||||||
|
Codons List: [ATG, CGA, GTG, TTG, AAG, TTC, GGC, GGT, ACA, TCA, GTG, GCA, AAT, GCA, GAA, CGT, TTT, CTG, CGG, GTT, GCC, GAT, ATT, CTG, GAA, AGC, AAT, GCC, AGG, CAG, GGG, CAG, GTG, GCC, ACC, GTC, CTC, TCT, GCC, CCC, GCC, AAA, ATC, ACC, AAC, CAT, CTG, GTA, GCG, ATG, ATT, GAA, AAA, ACC, ATT, AGC, GGT, CAG, GAT, GCT, TTA, CCC, AAT, ATC, AGC, GAT, GCC, GAA, CGT, ATT, TTT, GCC, GAA, CTT, CTG, ACG, GGA, CTC, GCC, GCC, GCC, CAG, CCG, GGA, TTT, CCG, CTG, GCA, CAA, TTG, AAA, ACT, TTC, GTC, GAC, CAG, GAA, TTT, GCC, CAA, ATA, AAA, CAT, GTC, CTG, CAT, GGC, ATC, AGT, TTG, TTG, GGG, CAG, TGC, CCG, GAT, AGC, ATC, AAC, GCT, GCG, CTG, ATT, TGC, CGT, GGC, GAG, AAA, ATG, TCG, ATC, GCC, ATT, ATG, GCC, GGC, GTG, TTA, GAA, GCG, CGT, GGT, CAC, AAC, GTT, ACC, GTT, ATC, GAT, CCG, GTC, GAA, AAA, CTG, CTG, GCA, GTG, GGT, CAT, TAC, CTC, GAA, TCT, ACC, GTT, GAT, ATT, GCT, GAA, TCC, ACC, CGC, CGT, ATT, GCG, GCA, AGC, CGC, ATT, CCG, GCT, GAC, CAC, ATG, GTG, CTG, ATG, GCT, GGT, TTC, ACT, GCC, GGT, AAT, GAA, AAA, GGC, GAG, CTG, GTG, GTT, CTG, GGA, CGC, AAC, GGT, TCC, GAC, TAC, TCC, GCT, GCG, GTG, CTG, GCG, GCC, TGT, TTA, CGC, GCC, GAT, TGT, TGC, GAG, ATC, TGG, ACG, GAT, GTT, GAC, GGT, GTT, TAT, ACC, TGC, GAT, CCG, CGT, CAG, GTG, CCC, GAT, GCG, AGG, TTG, TTG, AAG, TCG, ATG, TCC, TAT, CAG, GAA, GCG, ATG, GAG, CTT, TCT, TAC, TTC, GGC, GCT, AAA, GTT, CTT, CAC, CCC, CGC, ACC, ATT, ACC, CCC, ATC, GCC, CAG, TTC, CAG, ATC, CCT, TGC, CTG, ATT, AAA, AAT, ACC, GGA, AAT, CCC, CAA, GCA, CCA, GGT, ACG, CTC, ATT, GGT, GCC, AGC, CGT, GAT, GAA, GAC, GAA, TTA, CCG, GTC, AAG, GGC, ATT, TCC, AAT, CTG, AAT, AAC, ATG, GCA, ATG, TTC, AGC, GTT, TCC, GGC, CCG, GGG, ATG, AAA, GGG, ATG, GTT, GGC, ATG, GCG, GCG, CGC, GTC, TTT, GCA, GCG, ATG, TCA, CGC, GCC, CGT, ATT, TCC, GTG, GTG, CTG, ATT, ACG, CAA, TCA, TCT, TCC, GAA, TAC, AGT, ATC, AGT, TTC, TGC, GTT, CCG, CAA, AGC, GAC, TGT, GTG, CGA, GCT, GAA, CGG, GCA, ATG, CAG, GAA, GAG, TTC, TAC, CTG, GAA, CTG, AAA, GAA, GGC, TTA, CTG, GAG, CCG, TTG, GCG, GTG, ACG, GAA, CGG, CTG, GCC, 
ATT, ATC, TCG, GTG, GTA, GGT, GAT, GGT, ATG, CGC, ACC, TTA, CGT, GGG, ATC, TCG, GCG, AAA, TTC, TTT, GCC, GCG, CTG, GCC, CGC, GCC, AAT, ATC, AAC, ATT, GTC, GCC, ATT, GCT, CAG, GGA, TCT, TCT, GAA, CGC, TCA, ATC, TCT, GTC, GTG, GTC, AAT, AAC, GAT, GAT, GCG, ACC, ACT, GGC, GTG, CGC, GTT, ACT, CAT, CAG, ATG, CTG, TTC, AAT, ACC, GAT, CAG, GTT, ATC, GAA, GTG, TTT, GTG, ATT, GGC, GTC, GGT, GGC, GTT, GGC, GGT, GCG, CTG, CTG, GAG, CAA, CTG, AAG, CGT, CAG, CAA, AGC, TGG, TTG, AAG, AAT, AAA, CAT, ATC, GAC, TTA, CGT, GTC, TGC, GGT, GTT, GCT, AAC, TCG, AAG, GCA, CTG, CTC, ACC, AAT, GTA, CAT, GGC, CTT, AAT, CTG, GAA, AAC, TGG, CAG, GAA, GAA, CTG, GCG, CAA, GCC, AAA, GAG, CCG, TTT, AAT, CTC, GGG, CGC, TTA, ATT, CGC, CTC, GTG, AAA, GAA, TAT, CAT, CTG, CTG, AAC, CCG, GTC, ATT, GTT, GAC, TGT, ACT, TCC, AGC, CAG, GCT, GTG, GCA, GAT, CAA, TAT, GCC, GAC, TTC, CTG, CGC, GAA, GGT, TTC, CAC, GTT, GTT, ACG, CCG, AAC, AAA, AAG, GCC, AAC, ACC, TCG, TCG, ATG, GAT, TAC, TAC, CAT, CAG, TTG, CGT, TAT, GCG, GCG, GAA, AAA, TCG, CGG, CGT, AAA, TTC, CTC, TAT, GAC, ACC, AAC, GTT, GGG, GCT, GGA, TTA, CCG, GTT, ATT, GAG, AAC, CTG, CAA, AAT, CTG, CTC, AAT, GCT, GGT, GAT, GAA, TTG, ATG, AAG, TTC, TCC, GGC, ATT, CTT, TCA, GGT, TCG, CTT, TCT, TAT, ATC, TTC, GGC, AAG, TTA, GAC, GAA, GGC, ATG, AGT, TTC, TCC, GAG, GCG, ACC, ACA, CTG, GCG, CGG, GAA, ATG, GGT, TAT, ACC, GAA, CCG, GAC, CCG, CGA, GAT, GAT, CTT, TCT, GGT, ATG, GAT, GTG, GCG, CGT, AAG, CTA, TTG, ATT, CTC, GCT, CGT, GAA, ACG, GGA, CGT, GAA, CTG, GAG, CTG, GCG, GAT, ATT, GAA, ATT, GAA, CCT, GTG, CTG, CCC, GCA, GAG, TTT, AAC, GCC, GAG, GGT, GAT, GTC, GCC, GCT, TTT, ATG, GCG, AAT, CTG, TCA, CAG, CTC, GAC, GAT, CTC, TTT, GCC, GCG, CGT, GTG, GCG, AAG, GCC, CGT, GAT, GAA, GGA, AAA, GTT, TTG, CGC, TAT, GTT, GGC, AAT, ATT, GAT, GAA, GAT, GGC, GTC, TGC, CGC, GTG, AAG, ATT, GCC, GAA, GTG, GAT, GGT, AAT, GAT, CCG, CTG, TTC, AAA, GTG, AAA, AAT, GGC, GAA, AAC, GCC, CTG, GCC, TTC, TAT, AGC, CAC, TAT, TAT, CAG, CCG, CTG, CCG, TTG, GTA, CTG, CGC, GGA, TAT, GGT, GCG, 
GGC, AAT, GAC, GTT, ACA, GCT, GCC, GGT, GTC, TTT, GCT, GAT, CTG, CTA, CGT, ACC, CTC, TCA, TGG, AAG, TTA, GGA, GTC, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: homoserine kinase
|
||||||
|
Nucleotides: ATGGTTAAAGTTTATGCCCCGGCTTCCAGTGCCAATATGAGCGTCGGGTTTGATGTGCTCGGGGCGGCGGTGACACCTGTTGATGGTGCATTGCTCGGAGATGTAGTCACGGTTGAGGCGGCAGAGACATTCAGTCTCAACAACCTCGGACGCTTTGCCGATAAGCTGCCGTCAGAGCCACGGGAAAATATCGTTTATCAGTGCTGGGAGCGTTTTTGCCAGGAGCTTGGCAAGCAAATTCCAGTGGCGATGACTCTGGAAAAGAATATGCCGATCGGTTCGGGCTTAGGCTCCAGCGCCTGTTCAGTGGTCGCGGCGCTGATGGCGATGAATGAACACTGCGGCAAGCCGCTTAATGACACTCGTTTGCTGGCTTTGATGGGCGAGTTGGAAGGGCGTATCTCCGGCAGCATTCATTACGACAACGTGGCACCGTGTTTTCTTGGTGGTATGCAGTTGATGATCGAAGAAAACGACATCATCAGCCAGCAAGTGCCAGGGTTTGATGAGTGGCTGTGGGTGCTGGCGTATCCGGGGATTAAAGTCTCGACGGCAGAAGCCAGGGCTATTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCACGGGCGACATCTGGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATGAAAGATGTTATCGCTGAACCCTACCGTGAACGGTTACTGCCAGGCTTCCGGCAGGCGCGGCAGGCGGTTGCGGAAATCGGCGCGGTAGCGAGCGGTATCTCCGGCTCCGGCCCGACTTTGTTCGCTCTGTGTGACAAGCCGGATACCGCCCAGCGCGTTGCCGACTGGTTGGGTAAGAACTACCTGCAAAATCAGGAAGGTTTTGTTCATATTTGCCGGCTGGATACGGCGGGCGCACGAGTACTGGAAAACTAA
|
||||||
|
Nuc. Counts: [193, 226, 295, 219]
|
||||||
|
Total Mass%: [21.16, 20.37, 36.17, 22.23] of 123268.3
|
||||||
|
Codons List: [ATG, GTT, AAA, GTT, TAT, GCC, CCG, GCT, TCC, AGT, GCC, AAT, ATG, AGC, GTC, GGG, TTT, GAT, GTG, CTC, GGG, GCG, GCG, GTG, ACA, CCT, GTT, GAT, GGT, GCA, TTG, CTC, GGA, GAT, GTA, GTC, ACG, GTT, GAG, GCG, GCA, GAG, ACA, TTC, AGT, CTC, AAC, AAC, CTC, GGA, CGC, TTT, GCC, GAT, AAG, CTG, CCG, TCA, GAG, CCA, CGG, GAA, AAT, ATC, GTT, TAT, CAG, TGC, TGG, GAG, CGT, TTT, TGC, CAG, GAG, CTT, GGC, AAG, CAA, ATT, CCA, GTG, GCG, ATG, ACT, CTG, GAA, AAG, AAT, ATG, CCG, ATC, GGT, TCG, GGC, TTA, GGC, TCC, AGC, GCC, TGT, TCA, GTG, GTC, GCG, GCG, CTG, ATG, GCG, ATG, AAT, GAA, CAC, TGC, GGC, AAG, CCG, CTT, AAT, GAC, ACT, CGT, TTG, CTG, GCT, TTG, ATG, GGC, GAG, TTG, GAA, GGG, CGT, ATC, TCC, GGC, AGC, ATT, CAT, TAC, GAC, AAC, GTG, GCA, CCG, TGT, TTT, CTT, GGT, GGT, ATG, CAG, TTG, ATG, ATC, GAA, GAA, AAC, GAC, ATC, ATC, AGC, CAG, CAA, GTG, CCA, GGG, TTT, GAT, GAG, TGG, CTG, TGG, GTG, CTG, GCG, TAT, CCG, GGG, ATT, AAA, GTC, TCG, ACG, GCA, GAA, GCC, AGG, GCT, ATT, TTA, CCG, GCG, CAG, TAT, CGC, CGC, CAG, GAT, TGC, ATT, GCG, CAC, GGG, CGA, CAT, CTG, GCA, GGC, TTC, ATT, CAC, GCC, TGC, TAT, TCC, CGT, CAG, CTT, GAG, CTT, GCC, GCG, AAG, CTG, ATG, AAA, GAT, GTT, ATC, GCT, GAA, CCC, TAC, CGT, GAA, CGG, TTA, CTG, CCA, GGC, TTC, CGG, CAG, GCG, CGG, CAG, GCG, GTT, GCG, GAA, ATC, GGC, GCG, GTA, GCG, AGC, GGT, ATC, TCC, GGC, TCC, GGC, CCG, ACT, TTG, TTC, GCT, CTG, TGT, GAC, AAG, CCG, GAT, ACC, GCC, CAG, CGC, GTT, GCC, GAC, TGG, TTG, GGT, AAG, AAC, TAC, CTG, CAA, AAT, CAG, GAA, GGT, TTT, GTT, CAT, ATT, TGC, CGG, CTG, GAT, ACG, GCG, GGC, GCA, CGA, GTA, CTG, GAA, AAC, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: threonine synthase
|
||||||
|
Nucleotides: ATGAAACTCTACAATCTGAAAGATCACAATGAGCAGGTCAGCTTTGCGCAAGCCGTAACCCAGGGGTTAGGCAAAAATCAGGGGCTGTTTTTTCCGCACGACCTGCCGGAATTCAGCCTGACTGAAATTGATGAGATGCTGAAGCTGGATTTTGTCACCCGCAGTGCGAAGATCCTCTCGGCGTTTATTGGTGATGAAATCCCGCAGGAAATCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAAGCGATGTCGGTTGTCTGGAATTGTTCCACGGGCCAACGCTGGCATTTAAAGATTTCGGCGGTCGCTTTATGGCACAAATGCTGACCCATATTGCGGGCGATAAGCCAGTGACCATTCTGACCGCGACATCCGGTGATACTGGAGCGGCAGTGGCTCATGCTTTCTACGGTTTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTGTTCTGTACATTGGGCGGCAATATCGAAACTGTTGCCATCGACGGCGATTTCGATGCCTGTCAGGCGCTGGTGAAGCAGGCGTTTGATGATGAAGAACTGAAAGTGGCGCTGGGGCTGAATTCTGCTAACTCCATCAACATCAGTCGCTTGCTGGCGCAGATTTGTTATTACTTTGAGGCTGTCGCACAGTTGCCGCAAGAAGCACGTAACCAGTTGGTTGTCTCGGTACCGAGTGGAAACTTCGGCGATTTGACGGCGGGTCTGCTGGCGAAGTCACTCGGTCTGCCGGTAAAACGTTTTATTGCTGCGACCAACGTGAACGATACCGTACCACGTTTCCTGCACGACGGTCAGTGGTCACCCAAAGCGACTCAGGCGACGTTATCCAATGCGATGGATGTTAGCCAGCCAAACAACTGGCCGCGTGTGGAAGAGTTGTTCCGCCGCAAAATCTGGCAACTGAAAGAGCTGGGTTATGCAGCCGTGGATGATGAAACCACGCAACAGACAATGCGTGAGTTAAAAGAACTGGGCTATACCTCGGAGCCGCACGCTGCCGTAGCTTATCGTGCGCTGCGTGACCAGTTGAATCCAGGCGAATATGGCTTGTTCCTCGGCACCGCGCATCCGGCGAAATTTAAAGAGAGCGTGGAAGCGATTCTCGGTGAAACGTTGGATCTGCCAAAAGAGCTGGCAGAACGTGCTGATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAATTGATGATGAATCATCAGTAA
|
||||||
|
Nuc. Counts: [309, 311, 358, 309]
|
||||||
|
Total Mass%: [24.69, 20.43, 32.0, 22.86] of 169097.5
|
||||||
|
Codons List: [ATG, AAA, CTC, TAC, AAT, CTG, AAA, GAT, CAC, AAT, GAG, CAG, GTC, AGC, TTT, GCG, CAA, GCC, GTA, ACC, CAG, GGG, TTA, GGC, AAA, AAT, CAG, GGG, CTG, TTT, TTT, CCG, CAC, GAC, CTG, CCG, GAA, TTC, AGC, CTG, ACT, GAA, ATT, GAT, GAG, ATG, CTG, AAG, CTG, GAT, TTT, GTC, ACC, CGC, AGT, GCG, AAG, ATC, CTC, TCG, GCG, TTT, ATT, GGT, GAT, GAA, ATC, CCG, CAG, GAA, ATC, CTG, GAA, GAG, CGC, GTA, CGT, GCG, GCG, TTT, GCC, TTC, CCG, GCT, CCG, GTC, GCC, AAT, GTT, GAA, AGC, GAT, GTC, GGT, TGT, CTG, GAA, TTG, TTC, CAC, GGG, CCA, ACG, CTG, GCA, TTT, AAA, GAT, TTC, GGC, GGT, CGC, TTT, ATG, GCA, CAA, ATG, CTG, ACC, CAT, ATT, GCG, GGC, GAT, AAG, CCA, GTG, ACC, ATT, CTG, ACC, GCG, ACA, TCC, GGT, GAT, ACT, GGA, GCG, GCA, GTG, GCT, CAT, GCT, TTC, TAC, GGT, TTA, CCG, AAT, GTG, AAA, GTG, GTT, ATC, CTC, TAT, CCA, CGA, GGC, AAA, ATC, AGT, CCA, CTG, CAA, GAA, AAA, CTG, TTC, TGT, ACA, TTG, GGC, GGC, AAT, ATC, GAA, ACT, GTT, GCC, ATC, GAC, GGC, GAT, TTC, GAT, GCC, TGT, CAG, GCG, CTG, GTG, AAG, CAG, GCG, TTT, GAT, GAT, GAA, GAA, CTG, AAA, GTG, GCG, CTG, GGG, CTG, AAT, TCT, GCT, AAC, TCC, ATC, AAC, ATC, AGT, CGC, TTG, CTG, GCG, CAG, ATT, TGT, TAT, TAC, TTT, GAG, GCT, GTC, GCA, CAG, TTG, CCG, CAA, GAA, GCA, CGT, AAC, CAG, TTG, GTT, GTC, TCG, GTA, CCG, AGT, GGA, AAC, TTC, GGC, GAT, TTG, ACG, GCG, GGT, CTG, CTG, GCG, AAG, TCA, CTC, GGT, CTG, CCG, GTA, AAA, CGT, TTT, ATT, GCT, GCG, ACC, AAC, GTG, AAC, GAT, ACC, GTA, CCA, CGT, TTC, CTG, CAC, GAC, GGT, CAG, TGG, TCA, CCC, AAA, GCG, ACT, CAG, GCG, ACG, TTA, TCC, AAT, GCG, ATG, GAT, GTT, AGC, CAG, CCA, AAC, AAC, TGG, CCG, CGT, GTG, GAA, GAG, TTG, TTC, CGC, CGC, AAA, ATC, TGG, CAA, CTG, AAA, GAG, CTG, GGT, TAT, GCA, GCC, GTG, GAT, GAT, GAA, ACC, ACG, CAA, CAG, ACA, ATG, CGT, GAG, TTA, AAA, GAA, CTG, GGC, TAT, ACC, TCG, GAG, CCG, CAC, GCT, GCC, GTA, GCT, TAT, CGT, GCG, CTG, CGT, GAC, CAG, TTG, AAT, CCA, GGC, GAA, TAT, GGC, TTG, TTC, CTC, GGC, ACC, GCG, CAT, CCG, GCG, AAA, TTT, AAA, GAG, AGC, GTG, GAA, GCG, ATT, CTC, GGT, GAA, ACG, TTG, GAT, CTG, CCA, 
AAA, GAG, CTG, GCA, GAA, CGT, GCT, GAT, TTA, CCC, TTG, CTT, TCG, CAT, AAC, CTG, CCC, GCC, GAT, TTT, GCT, GCG, TTG, CGT, AAA, TTG, ATG, ATG, AAT, CAT, CAG, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: hypothetical protein
|
||||||
|
Nucleotides: ATGCAGCCCGGCTTTTTTTATGAAGAAAATATGGAGAAAAACGACAGGGAAAAAGGAGAAATTCTCAATAAATGCGGTAACTTAGAGATTAGGATTGCGGAGAATAACAACTGCCGTTCTCATCGCGTAATCTCCGGATATCGACCCATAACGGGCAATGATAAAAGGAGTAACCTGTGA
|
||||||
|
Nuc. Counts: [66, 31, 43, 40]
|
||||||
|
Total Mass%: [37.57, 14.51, 27.37, 21.08] of 23739.3
|
||||||
|
Codons List: [ATG, CAG, CCC, GGC, TTT, TTT, TAT, GAA, GAA, AAT, ATG, GAG, AAA, AAC, GAC, AGG, GAA, AAA, GGA, GAA, ATT, CTC, AAT, AAA, TGC, GGT, AAC, TTA, GAG, ATT, AGG, ATT, GCG, GAG, AAT, AAC, AAC, TGC, CGT, TCT, CAT, CGC, GTA, ATC, TCC, GGA, TAT, CGA, CCC, ATA, ACG, GGC, AAT, GAT, AAA, AGG, AGT, AAC, CTG, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: Non-protein region
|
||||||
|
Nucleotides: AAAAACTGCTGGAAACAATGAAAGACGTACCGGACGACCAACGTCAGGCGC
|
||||||
|
Nuc. Counts: [20, 13, 13, 5]
|
||||||
|
Total Mass%: [39.46, 21.09, 28.68, 9.13] of 6849.2
|
||||||
|
Codons List: [AAA, AAC, TGC, TGG, AAA, CAA, TGA, AAG, ACG, TAC, CGG, ACG, ACC, AAC, GTC, AGG, CGC]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: transaldolase B
|
||||||
|
Nucleotides: ATGACGGACAAATTGACCTCCCTTCGTCAGTACACCACCGTAGTGGCCGACACTGGGGACATCGCGGCAATGAAGCTGTATCAACCGCAGGATGCCACAACCAACCCTTCTCTCATTCTTAACGCAGCGCAGATTCCGGAATACCGTAAGTTGATTGATGATGCTGTCGCCTGGGCGAAACAGCAGAGCAACGATCGCGCGCAGCAGATCGTGGACGCGACCGACAAACTGGCAGTAAATATTGGTCTGGAAATCCTGAAACTGGTTCCGGGCCGTATCTCAACTGAAGTTGATGCGCGTCTTTCCTATGACACCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGCAGGTATTAGCAACGATCGTATTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGCAGAACAGCTGGAAAAAGAAGGTATTAACTGTAACCTGACCCTGCTGTTCTCCTTCGCTCAGGCTCGTGCTTGTGCGGAAGCGGGCGTGTTCCTGATCTCGCCGTTTGTTGGCCGTATTCTTGACTGGTACAAAGCGAATACCGATAAGAAAGAGTACGCTCCGGCAGAAGATCCGGGCGTGGTTTCTGTATCTGAAATCTACCAGTACTACAAAGAGCATGGTTATGAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAACTGGCAGGCTGCGACCGTCTGACCATCGCACCGGCACTGCTGAAAGAGCTGGCGGAGAGCGAAGGGGCTATCGAACGTAAACTGTCTTACACTGGTGAAGTGAAAGCGCGTCCGGCGCGTATCACTGAGTCCGAGTTCCTGTGGCAGCACAACCAGGATCCAATGGCAGTAGATAAACTGGCGGAAGGTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCTGTAA
|
||||||
|
Nuc. Counts: [252, 236, 256, 210]
|
||||||
|
Total Mass%: [27.11, 20.88, 30.8, 20.92] of 125598.0
|
||||||
|
Codons List: [ATG, ACG, GAC, AAA, TTG, ACC, TCC, CTT, CGT, CAG, TAC, ACC, ACC, GTA, GTG, GCC, GAC, ACT, GGG, GAC, ATC, GCG, GCA, ATG, AAG, CTG, TAT, CAA, CCG, CAG, GAT, GCC, ACA, ACC, AAC, CCT, TCT, CTC, ATT, CTT, AAC, GCA, GCG, CAG, ATT, CCG, GAA, TAC, CGT, AAG, TTG, ATT, GAT, GAT, GCT, GTC, GCC, TGG, GCG, AAA, CAG, CAG, AGC, AAC, GAT, CGC, GCG, CAG, CAG, ATC, GTG, GAC, GCG, ACC, GAC, AAA, CTG, GCA, GTA, AAT, ATT, GGT, CTG, GAA, ATC, CTG, AAA, CTG, GTT, CCG, GGC, CGT, ATC, TCA, ACT, GAA, GTT, GAT, GCG, CGT, CTT, TCC, TAT, GAC, ACC, GAA, GCG, TCA, ATT, GCG, AAA, GCA, AAA, CGC, CTG, ATC, AAA, CTC, TAC, AAC, GAT, GCA, GGT, ATT, AGC, AAC, GAT, CGT, ATT, CTG, ATC, AAA, CTG, GCT, TCT, ACC, TGG, CAG, GGT, ATC, CGT, GCT, GCA, GAA, CAG, CTG, GAA, AAA, GAA, GGT, ATT, AAC, TGT, AAC, CTG, ACC, CTG, CTG, TTC, TCC, TTC, GCT, CAG, GCT, CGT, GCT, TGT, GCG, GAA, GCG, GGC, GTG, TTC, CTG, ATC, TCG, CCG, TTT, GTT, GGC, CGT, ATT, CTT, GAC, TGG, TAC, AAA, GCG, AAT, ACC, GAT, AAG, AAA, GAG, TAC, GCT, CCG, GCA, GAA, GAT, CCG, GGC, GTG, GTT, TCT, GTA, TCT, GAA, ATC, TAC, CAG, TAC, TAC, AAA, GAG, CAT, GGT, TAT, GAA, ACC, GTG, GTT, ATG, GGC, GCA, AGC, TTC, CGT, AAC, ATC, GGC, GAA, ATT, CTG, GAA, CTG, GCA, GGC, TGC, GAC, CGT, CTG, ACC, ATC, GCA, CCG, GCA, CTG, CTG, AAA, GAG, CTG, GCG, GAG, AGC, GAA, GGG, GCT, ATC, GAA, CGT, AAA, CTG, TCT, TAC, ACT, GGT, GAA, GTG, AAA, GCG, CGT, CCG, GCG, CGT, ATC, ACT, GAG, TCC, GAG, TTC, CTG, TGG, CAG, CAC, AAC, CAG, GAT, CCA, ATG, GCA, GTA, GAT, AAA, CTG, GCG, GAA, GGT, ATC, CGT, AAG, TTT, GCT, GTT, GAC, CAG, GAA, AAA, CTG, GAA, AAA, ATG, ATC, GGC, GAT, CTG, CTG, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: molybdopterin biosynthesis mog protein
|
||||||
|
Nucleotides: ATGAATACTTTACGTATTGGCTTAGTTTCCATCTCTGATCGCGCATCCAGCGGCGTTTATCAGGATAAAGGCATCCCTGCGCTGGAAGAATGGCTGACATCGGCGCTAACCACGCCGTTTGAACTGGAAACCCGCTTAATCCCCGATGAGCAGGCGATCATCGAGCAAACGTTGTGTGAGCTGGTGGATGAAATGAGTTGCCATCTGGTGCTCACCACGGGCGGAACTGGCCCTGCGCGTCGTGACGTAACGCCCGATGCGACGCTGGCAGTAGCGGACCGCGAGATGCCAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACCAACTGCGATCCTTTCGCGTCAGGTGGGGGTGATTCGCAAACAGGCGCTGATCCTTAACTTACCCGGTCAACCGAAGTCTATTAAAGAGACGCTGGAAGGTGTGAAGGACGCTGAGGGTAACGTTGTGGTGCACGGTATTTTTGCCAGCGTACCGTACTGCATTCAGTTGCTGGAAGGGCCATACGTTGAAACGGCACCGGAAGTGGTTGCAGCATTCAGACCGAAGAGTGCAAGACGCGAAGTTAGCGAATAA
|
||||||
|
Nuc. Counts: [139, 143, 175, 131]
|
||||||
|
Total Mass%: [24.18, 20.45, 34.05, 21.1] of 77675.0
|
||||||
|
Codons List: [ATG, AAT, ACT, TTA, CGT, ATT, GGC, TTA, GTT, TCC, ATC, TCT, GAT, CGC, GCA, TCC, AGC, GGC, GTT, TAT, CAG, GAT, AAA, GGC, ATC, CCT, GCG, CTG, GAA, GAA, TGG, CTG, ACA, TCG, GCG, CTA, ACC, ACG, CCG, TTT, GAA, CTG, GAA, ACC, CGC, TTA, ATC, CCC, GAT, GAG, CAG, GCG, ATC, ATC, GAG, CAA, ACG, TTG, TGT, GAG, CTG, GTG, GAT, GAA, ATG, AGT, TGC, CAT, CTG, GTG, CTC, ACC, ACG, GGC, GGA, ACT, GGC, CCT, GCG, CGT, CGT, GAC, GTA, ACG, CCC, GAT, GCG, ACG, CTG, GCA, GTA, GCG, GAC, CGC, GAG, ATG, CCA, GGC, TTT, GGT, GAA, CAG, ATG, CGC, CAG, ATC, AGC, CTG, CAT, TTT, GTA, CCA, ACT, GCG, ATC, CTT, TCG, CGT, CAG, GTG, GGG, GTG, ATT, CGC, AAA, CAG, GCG, CTG, ATC, CTT, AAC, TTA, CCC, GGT, CAA, CCG, AAG, TCT, ATT, AAA, GAG, ACG, CTG, GAA, GGT, GTG, AAG, GAC, GCT, GAG, GGT, AAC, GTT, GTG, GTG, CAC, GGT, ATT, TTT, GCC, AGC, GTA, CCG, TAC, TGC, ATT, CAG, TTG, CTG, GAA, GGG, CCA, TAC, GTT, GAA, ACG, GCA, CCG, GAA, GTG, GTT, GCA, GCA, TTC, AGA, CCG, AAG, AGT, GCA, AGA, CGC, GAA, GTT, AGC, GAA, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: chaperone protein DnaK
|
||||||
|
Nucleotides: ATGGGTAAAATAATTGGTATCGACCTGGGTACTACCAACTCTTGTGTAGCGATTATGGATGGCACCACTCCTCGTGTACTGGAGAACGCCGAAGGCGATCGCACCACGCCTTCTATCATTGCCTATACCCAGGATGGTGAAACTCTGGTTGGTCAGCCGGCTAAACGTCAGGCAGTGACGAACCCGCAAAACACCCTGTTTGCGATTAAACGCCTGATTGGCCGCCGCTTCCAGGACGAAGAAGTACAGCGTGATGTTTCCATCATGCCGTTCAAAATTATTGCTGCTGATAACGGCGACGCATGGGTCGAAGTTAAAGGCCAGAAAATGGCACCGCCGCAGATCTCTGCTGAAGTGCTGAAAAAAATGAAGAAAACCGCTGAAGATTACCTGGGTGAACCGGTAACTGAAGCTGTTATTACCGTACCGGCATACTTTAACGATGCTCAGCGTCAGGCAACCAAAGACGCAGGCCGTATCGCTGGTCTGGAAGTAAAACGTATCATCAACGAACCGACCGCAGCTGCGCTGGCTTACGGTCTGGACAAAGGTACTGGCAACCGTACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTCCATTATCGAAATCGACGAAGTTGACGGCGAAAAAACCTTCGAAGTTCTGGCAACCAACGGTGATACCCACCTGGGTGGTGAAGACTTCGACAGTCGTCTGATCAACTATCTGGTTGAAGAATTCAAGAAAGATCAGGGCATTGACCTGCGCAACGATCCGCTGGCAATGCAGCGCCTGAAAGAAGCGGCAGAAAAAGCGAAAATCGAACTGTCTTCCGCTCAGCAGACCGACGTTAACCTGCCGTACATCACTGCAGACGCGACCGGTCCGAAACACATGAACATCAAAGTGACTCGTGCGAAACTGGAAAGCCTGGTTGAAGATCTGGTAAACCGTTCCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATATCGACGACGTTATTCTCGTTGGTGGTCAGACTCGTATGCCAATGGTTCAGAAGAAAGTTGCTGAATTCTTTGGTAAAGAGCCGCGTAAAGATGTTAACCCGGACGAAGCTGTAGCCATCGGTGCTGCTGTTCAGGGTGGTGTTCTGACTGGTGACGTAAAAGACGTACTGCTGCTGGACGTTACCCCGCTGTCTCTGGGTATCGAAACCATGGGCGGTGTGATGACCACGCTGATCGCGAAAAACACCACTATCCCGACCAAGCACAGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATCCATGTGCTGCAGGGTGAACGTAAACGTGCGGCTGATAACAAATCTCTGGGTCAGTTCAACCTGGATGGTATCAACCCGGCACCGCGCGGCATGCCGCAGATCGAAGTTACCTTCGATATCGATGCTGACGGTATCCTGCACGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCACTATCAAGGCTTCTTCTGGTCTGAACGAAGATGAAATCCAGAAAATGGTACGCGACGCAGAAGCTAACGCCGAAGCTGACCGTAAGTTTGAAGAGCTGGTACAGACTCGCAACCAGGGCGACCATCTGCTGCACAGCACCCGTAAGCAGGTTGAAGAAGCAGGCGACAAACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGACTGCACTGGAAACTGCTCTGAAAGGTGAAGACAAAGCCGCTATCGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCAGCAGCAACATGCCCAGCAGCAGACTGCCGGTGCTGATGCTTCTGCAAACAACGCGAAAGATGACGATGTTGTCGACGCTGAATTTGAAGAAGTCAAAGACAAAAAATAA
|
||||||
|
Nuc. Counts: [541, 475, 504, 397]
|
||||||
|
Total Mass%: [28.92, 20.88, 30.13, 19.65] of 252806.4
|
||||||
|
Codons List: [ATG, GGT, AAA, ATA, ATT, GGT, ATC, GAC, CTG, GGT, ACT, ACC, AAC, TCT, TGT, GTA, GCG, ATT, ATG, GAT, GGC, ACC, ACT, CCT, CGT, GTA, CTG, GAG, AAC, GCC, GAA, GGC, GAT, CGC, ACC, ACG, CCT, TCT, ATC, ATT, GCC, TAT, ACC, CAG, GAT, GGT, GAA, ACT, CTG, GTT, GGT, CAG, CCG, GCT, AAA, CGT, CAG, GCA, GTG, ACG, AAC, CCG, CAA, AAC, ACC, CTG, TTT, GCG, ATT, AAA, CGC, CTG, ATT, GGC, CGC, CGC, TTC, CAG, GAC, GAA, GAA, GTA, CAG, CGT, GAT, GTT, TCC, ATC, ATG, CCG, TTC, AAA, ATT, ATT, GCT, GCT, GAT, AAC, GGC, GAC, GCA, TGG, GTC, GAA, GTT, AAA, GGC, CAG, AAA, ATG, GCA, CCG, CCG, CAG, ATC, TCT, GCT, GAA, GTG, CTG, AAA, AAA, ATG, AAG, AAA, ACC, GCT, GAA, GAT, TAC, CTG, GGT, GAA, CCG, GTA, ACT, GAA, GCT, GTT, ATT, ACC, GTA, CCG, GCA, TAC, TTT, AAC, GAT, GCT, CAG, CGT, CAG, GCA, ACC, AAA, GAC, GCA, GGC, CGT, ATC, GCT, GGT, CTG, GAA, GTA, AAA, CGT, ATC, ATC, AAC, GAA, CCG, ACC, GCA, GCT, GCG, CTG, GCT, TAC, GGT, CTG, GAC, AAA, GGT, ACT, GGC, AAC, CGT, ACT, ATC, GCG, GTT, TAT, GAC, CTG, GGT, GGT, GGT, ACT, TTC, GAT, ATT, TCC, ATT, ATC, GAA, ATC, GAC, GAA, GTT, GAC, GGC, GAA, AAA, ACC, TTC, GAA, GTT, CTG, GCA, ACC, AAC, GGT, GAT, ACC, CAC, CTG, GGT, GGT, GAA, GAC, TTC, GAC, AGT, CGT, CTG, ATC, AAC, TAT, CTG, GTT, GAA, GAA, TTC, AAG, AAA, GAT, CAG, GGC, ATT, GAC, CTG, CGC, AAC, GAT, CCG, CTG, GCA, ATG, CAG, CGC, CTG, AAA, GAA, GCG, GCA, GAA, AAA, GCG, AAA, ATC, GAA, CTG, TCT, TCC, GCT, CAG, CAG, ACC, GAC, GTT, AAC, CTG, CCG, TAC, ATC, ACT, GCA, GAC, GCG, ACC, GGT, CCG, AAA, CAC, ATG, AAC, ATC, AAA, GTG, ACT, CGT, GCG, AAA, CTG, GAA, AGC, CTG, GTT, GAA, GAT, CTG, GTA, AAC, CGT, TCC, ATT, GAG, CCG, CTG, AAA, GTT, GCA, CTG, CAG, GAC, GCT, GGC, CTG, TCC, GTA, TCT, GAT, ATC, GAC, GAC, GTT, ATT, CTC, GTT, GGT, GGT, CAG, ACT, CGT, ATG, CCA, ATG, GTT, CAG, AAG, AAA, GTT, GCT, GAA, TTC, TTT, GGT, AAA, GAG, CCG, CGT, AAA, GAT, GTT, AAC, CCG, GAC, GAA, GCT, GTA, GCC, ATC, GGT, GCT, GCT, GTT, CAG, GGT, GGT, GTT, CTG, ACT, GGT, GAC, GTA, AAA, GAC, GTA, CTG, CTG, CTG, GAC, GTT, ACC, CCG, CTG, 
TCT, CTG, GGT, ATC, GAA, ACC, ATG, GGC, GGT, GTG, ATG, ACC, ACG, CTG, ATC, GCG, AAA, AAC, ACC, ACT, ATC, CCG, ACC, AAG, CAC, AGC, CAG, GTG, TTC, TCT, ACC, GCT, GAA, GAC, AAC, CAG, TCT, GCG, GTA, ACC, ATC, CAT, GTG, CTG, CAG, GGT, GAA, CGT, AAA, CGT, GCG, GCT, GAT, AAC, AAA, TCT, CTG, GGT, CAG, TTC, AAC, CTG, GAT, GGT, ATC, AAC, CCG, GCA, CCG, CGC, GGC, ATG, CCG, CAG, ATC, GAA, GTT, ACC, TTC, GAT, ATC, GAT, GCT, GAC, GGT, ATC, CTG, CAC, GTT, TCC, GCG, AAA, GAC, AAA, AAC, AGC, GGT, AAA, GAG, CAG, AAG, ATC, ACT, ATC, AAG, GCT, TCT, TCT, GGT, CTG, AAC, GAA, GAT, GAA, ATC, CAG, AAA, ATG, GTA, CGC, GAC, GCA, GAA, GCT, AAC, GCC, GAA, GCT, GAC, CGT, AAG, TTT, GAA, GAG, CTG, GTA, CAG, ACT, CGC, AAC, CAG, GGC, GAC, CAT, CTG, CTG, CAC, AGC, ACC, CGT, AAG, CAG, GTT, GAA, GAA, GCA, GGC, GAC, AAA, CTG, CCG, GCT, GAC, GAC, AAA, ACT, GCT, ATC, GAG, TCT, GCG, CTG, ACT, GCA, CTG, GAA, ACT, GCT, CTG, AAA, GGT, GAA, GAC, AAA, GCC, GCT, ATC, GAA, GCG, AAA, ATG, CAG, GAA, CTG, GCA, CAG, GTT, TCC, CAG, AAA, CTG, ATG, GAA, ATC, GCC, CAG, CAG, CAA, CAT, GCC, CAG, CAG, CAG, ACT, GCC, GGT, GCT, GAT, GCT, TCT, GCA, AAC, AAC, GCG, AAA, GAT, GAC, GAT, GTT, GTC, GAC, GCT, GAA, TTT, GAA, GAA, GTC, AAA, GAC, AAA, AAA, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: chaperone protein DnaJ
|
||||||
|
Nucleotides: GTGCATTCATCTAGGGGCAATTTAAAAAAGATGGCTAAGCAAGATTATTACGAGATTTTAGGCGTTTCCAAAACAGCGGAAGAGCGTGAAATCAAAAAGGCCTACAAACGCCTGGCCATGAAATACCACCCGGACCGTAACCAGGGTGACAAAGAGGCCGAGGCGAAATTTAAAGAGATCAAGGAAGCTTATGAAGTTCTGACCGACTCGCAAAAACGTGCGGCATACGATCAGTATGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGCGGTTTTGGCGGCGGCGCAGACTTCAGCGATATTTTTGGTGACGTTTTCGGCGATATTTTTGGCGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTACGCTATAACATGGAGCTCACCCTCGAAGAAGCTGTACGTGGCGTGACCAAAGAGATCCGCATTCCGACTCTGGAAGAGTGTGACGTTTGCCACGGTAGCGGTGCAAAACCAGGTACACAGCCGCAGACCTGTCCGACCTGTCATGGTTCTGGCCAGGTGCAGATGCGCCAGGGTTTCTTTGCCGTGCAGCAGACCTGTCCACACTGTCAGGGCCGCGGTACGCTGATCAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGTTGAGCGCAGCAAAACGCTGTCCGTTAAAATCCCGGCAGGGGTGGACACTGGAGACCGCATCCGTCTTGCGGGCGAAGGTGAAGCGGGTGAACACGGCGCACCGGCAGGCGATCTGTACGTTCAGGTTCAGGTTAAACAGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGCGAAGTCCCGATCAACTTCGCTATGGCGGCGCTGGGTGGTGAAATCGAAGTACCGACCCTTGATGGTCGCGTCAAACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAGCTGTTCCGTATGCGCGGTAAAGGCGTCAAGTCTGTCCGCGGTGGCGCACAGGGTGATTTGCTATGCCGCGTTGTTGTCGAAACACCGGTAGGTTTGAACGAGAAGCAGAAACAGCTGCTGCAAGAGCTGCAAGAAAGCTTTGGTGGCCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCTTCTTTGATGGCGTGAAGAAGTTTTTTGACGACCTGACTCGCTAA
|
||||||
|
Nuc. Counts: [287, 278, 352, 244]
|
||||||
|
Total Mass%: [25.2, 20.07, 34.57, 19.84] of 153867.6
|
||||||
|
Codons List: [GTG, CAT, TCA, TCT, AGG, GGC, AAT, TTA, AAA, AAG, ATG, GCT, AAG, CAA, GAT, TAT, TAC, GAG, ATT, TTA, GGC, GTT, TCC, AAA, ACA, GCG, GAA, GAG, CGT, GAA, ATC, AAA, AAG, GCC, TAC, AAA, CGC, CTG, GCC, ATG, AAA, TAC, CAC, CCG, GAC, CGT, AAC, CAG, GGT, GAC, AAA, GAG, GCC, GAG, GCG, AAA, TTT, AAA, GAG, ATC, AAG, GAA, GCT, TAT, GAA, GTT, CTG, ACC, GAC, TCG, CAA, AAA, CGT, GCG, GCA, TAC, GAT, CAG, TAT, GGT, CAT, GCT, GCG, TTT, GAG, CAA, GGT, GGC, ATG, GGC, GGC, GGC, GGT, TTT, GGC, GGC, GGC, GCA, GAC, TTC, AGC, GAT, ATT, TTT, GGT, GAC, GTT, TTC, GGC, GAT, ATT, TTT, GGC, GGC, GGA, CGT, GGT, CGT, CAA, CGT, GCG, GCG, CGC, GGT, GCT, GAT, TTA, CGC, TAT, AAC, ATG, GAG, CTC, ACC, CTC, GAA, GAA, GCT, GTA, CGT, GGC, GTG, ACC, AAA, GAG, ATC, CGC, ATT, CCG, ACT, CTG, GAA, GAG, TGT, GAC, GTT, TGC, CAC, GGT, AGC, GGT, GCA, AAA, CCA, GGT, ACA, CAG, CCG, CAG, ACC, TGT, CCG, ACC, TGT, CAT, GGT, TCT, GGC, CAG, GTG, CAG, ATG, CGC, CAG, GGT, TTC, TTT, GCC, GTG, CAG, CAG, ACC, TGT, CCA, CAC, TGT, CAG, GGC, CGC, GGT, ACG, CTG, ATC, AAA, GAT, CCG, TGC, AAC, AAA, TGT, CAT, GGT, CAT, GGT, CGT, GTT, GAG, CGC, AGC, AAA, ACG, CTG, TCC, GTT, AAA, ATC, CCG, GCA, GGG, GTG, GAC, ACT, GGA, GAC, CGC, ATC, CGT, CTT, GCG, GGC, GAA, GGT, GAA, GCG, GGT, GAA, CAC, GGC, GCA, CCG, GCA, GGC, GAT, CTG, TAC, GTT, CAG, GTT, CAG, GTT, AAA, CAG, CAC, CCG, ATT, TTC, GAG, CGT, GAA, GGC, AAC, AAC, CTG, TAT, TGC, GAA, GTC, CCG, ATC, AAC, TTC, GCT, ATG, GCG, GCG, CTG, GGT, GGT, GAA, ATC, GAA, GTA, CCG, ACC, CTT, GAT, GGT, CGC, GTC, AAA, CTG, AAA, GTG, CCT, GGC, GAA, ACC, CAG, ACC, GGT, AAG, CTG, TTC, CGT, ATG, CGC, GGT, AAA, GGC, GTC, AAG, TCT, GTC, CGC, GGT, GGC, GCA, CAG, GGT, GAT, TTG, CTA, TGC, CGC, GTT, GTT, GTC, GAA, ACA, CCG, GTA, GGT, TTG, AAC, GAG, AAG, CAG, AAA, CAG, CTG, CTG, CAA, GAG, CTG, CAA, GAA, AGC, TTT, GGT, GGC, CCA, ACC, GGC, GAG, CAC, AAC, AGC, CCG, CGT, TCA, AAG, AGC, TTC, TTT, GAT, GGC, GTG, AAG, AAG, TTT, TTT, GAC, GAC, CTG, ACT, CGC, TAA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: hypothetical protein
|
||||||
|
Nucleotides: TTGCTCTTACTCGGATTCGTAAGCCGTGAAAACAGCAACCTCCGTCTGGCCAGTTCGGATGTGAACCTCACAGAGGTCTTTTCTCGTTACCAGCGCCGCCACTACGGCGGTGATACAGATGACGATCAGGGCGACAATCATCGCCTTATGCTGCTTCATTGCTCTCTTCTCCTTGACCTTTCGGTCAGTAAGAGGCACTCTACATGTGTTCTGCATATAGGGGGCCTCGGGTTGATGGTAAAATATCACTCGGGGCTTTTCTCTATCTGCCGTTCAGCTAATGCCTGA
|
||||||
|
Nuc. Counts: [58, 78, 69, 83]
|
||||||
|
Total Mass%: [21.04, 23.27, 28.0, 27.88] of 37245.0
|
||||||
|
Codons List: [TTG, CTC, TTA, CTC, GGA, TTC, GTA, AGC, CGT, GAA, AAC, AGC, AAC, CTC, CGT, CTG, GCC, AGT, TCG, GAT, GTG, AAC, CTC, ACA, GAG, GTC, TTT, TCT, CGT, TAC, CAG, CGC, CGC, CAC, TAC, GGC, GGT, GAT, ACA, GAT, GAC, GAT, CAG, GGC, GAC, AAT, CAT, CGC, CTT, ATG, CTG, CTT, CAT, TGC, TCT, CTT, CTC, CTT, GAC, CTT, TCG, GTC, AGT, AAG, AGG, CAC, TCT, ACA, TGT, GTT, CTG, CAT, ATA, GGG, GGC, CTC, GGG, TTG, ATG, GTA, AAA, TAT, CAC, TCG, GGG, CTT, TTC, TCT, ATC, TGC, CGT, TCA, GCT, AAT, GCC, TGA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: hypothetical protein
|
||||||
|
Nucleotides: ATGTCTGCCAAAAGACGACTTCTTATTGCGTGTACCTTGATAACAGCTATCTATCATTTTCCTGCATATTCTTCATTAGAATATAAAGGATCCTTTGGTTCAATAAATGCGGGTTATGCAGACTGGAATAGTGGATTTGTAAACACTCACCGTGGTGAAGTATGGAAAGTGACTGCGGATTTTGGGGTAAATTTTAAAGAAGCAGAATTTTACTCATTTTATGAAAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACGGTTTCAGCAATGACGCATGTCAGACTCTTTGACTCTGATATGACATTCTTTGGCAAAATTTATGGCCAATGGGATAACTCATGGGGTGACGATCTGGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCGAGTGGGGCTTTTTTAAACCGTATATTGGATTGCATAATCAATCTGGTGACTACGTATCAGCTAAATATGGTCAAACGAATGGTTGGAATGGTTATGTTGTTGGCTGGACAGCAGTATTACCATTTACGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGAAATAGAACTGGACAGGAACGATGCTTACACGGAGCAGCAATTTGGCCGGAACGGGTTAAATGGCGGTTTAACTATTGCCTGGAAGTTCTATCCTCGCTGGAAAGCCAGTGTGACGTGGCGTTATTTCGATAATAAGCTGGGCTACGATGGCTTTGGCGATCAAATGATTTATATGCTTGGTTATGATTTCTAA
|
||||||
|
Nuc. Counts: [214, 121, 184, 243]
|
||||||
|
Total Mass%: [29.25, 13.6, 28.13, 30.75] of 98860.9
|
||||||
|
Codons List: [ATG, TCT, GCC, AAA, AGA, CGA, CTT, CTT, ATT, GCG, TGT, ACC, TTG, ATA, ACA, GCT, ATC, TAT, CAT, TTT, CCT, GCA, TAT, TCT, TCA, TTA, GAA, TAT, AAA, GGA, TCC, TTT, GGT, TCA, ATA, AAT, GCG, GGT, TAT, GCA, GAC, TGG, AAT, AGT, GGA, TTT, GTA, AAC, ACT, CAC, CGT, GGT, GAA, GTA, TGG, AAA, GTG, ACT, GCG, GAT, TTT, GGG, GTA, AAT, TTT, AAA, GAA, GCA, GAA, TTT, TAC, TCA, TTT, TAT, GAA, AGT, AAT, GTA, CTC, AAT, CAT, GCT, GTA, GCA, GGG, AGA, AAT, CAT, ACG, GTT, TCA, GCA, ATG, ACG, CAT, GTC, AGA, CTC, TTT, GAC, TCT, GAT, ATG, ACA, TTC, TTT, GGC, AAA, ATT, TAT, GGC, CAA, TGG, GAT, AAC, TCA, TGG, GGT, GAC, GAT, CTG, GAC, ATG, TTT, TAT, GGA, TTC, GGT, TAC, CTC, GGC, TGG, AAC, GGC, GAG, TGG, GGC, TTT, TTT, AAA, CCG, TAT, ATT, GGA, TTG, CAT, AAT, CAA, TCT, GGT, GAC, TAC, GTA, TCA, GCT, AAA, TAT, GGT, CAA, ACG, AAT, GGT, TGG, AAT, GGT, TAT, GTT, GTT, GGC, TGG, ACA, GCA, GTA, TTA, CCA, TTT, ACG, TTA, TTT, GAC, GAA, AAA, TTT, GTT, TTA, TCT, AAC, TGG, AAT, GAA, ATA, GAA, CTG, GAC, AGG, AAC, GAT, GCT, TAC, ACG, GAG, CAG, CAA, TTT, GGC, CGG, AAC, GGG, TTA, AAT, GGC, GGT, TTA, ACT, ATT, GCC, TGG, AAG, TTC, TAT, CCT, CGC, TGG, AAA, GCC, AGT, GTG, ACG, TGG, CGT, TAT, TTC, GAT, AAT, AAG, CTG, GGC, TAC, GAT, GGC, TTT, GGC, GAT, CAA, ATG, ATT, TAT, ATG, CTT, GGT, TAT, GAT, TTC, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: putative secreted sulfatase
|
||||||
|
Nucleotides: ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAATGCTTTTAGTCCTGCCTTAGCCGCAGAGGCTAAACAACCTAATTTAGTCATTATTATGGCGGATGATTTAGGTTATGGCGATTTAGCAACATATGGTCATCAGATCGTTAAAACACCTAATATCGACAGGCTTGCCCAGGAAGGGGTCAAATTTACTGACTACTATGCCCCCGCTCCTTTAAGTTCACCTTCACGCGCAGGGCTATTAACCGGCCGGATGCCATTTCGTACTGGAATTCGCTCATGGATTCCTTCAGGCAAAGATGTTGCCTTAGGGCGTAACGAACTCACGATTGCTAATCTACTCAAAGCGCAAGGGTACGACACGGCAATGATGGGTAAGCTGCATCTGAATGCAGGCGGCGATCGCACCGATCAGCCACAAGCACAAGATATGGGCTTTGATTACTCACTGGTTAATACGGCGGGCTTTGTTACCGACGCCACGCTGGATAACGCTAAAGAACGCCCGCGTTATGGCATGGTTTACCCGACAGGCTGGCTACGTAACGGGCAACCCACTCCACGAGCTGATAAAATGAGCGGTGAGTATGTCAGTTCGGAAGTCGTCAACTGGCTGGATAACAAAAAGGACAGCAAGCCTTTCTTCCTCTATGTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAAAATACCTCGATATGTACTCACAATATATGAGCGCGTATCAGAAGCAGCATCCTGATTTATTTTATGGCGACTGGGCAGACAAACCCTGGCGTGGTGTGGGGGAATATTATGCCAATATCAGCTATCTGGATGCACAGGTTGGAAAAGTGCTGGATAAAATCAAAGCTGTGGGTGAAGAAGATAACACAATCGTTATTTTTACCAGTGATAACGGTCCGGTAACGCGTGAAGCGCGCAAAGTGTATGAGCTGAATTTGGCAGGGGAAACGGATGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGTGTTCCAGCCATTATTAAATATGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGTCTGGACTGGATGCCTACTTTAGCGAAAATGATGAACTTCAAATTACCTACAGACCGTACTTTCGATGGTGAATCGCTGGTTCCTGTTCTTGAGCAAAAAGCATTGAAACGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATGATCCAACCGATGAATGGGCGATCCGTGATGGTGACTGGAAGATGATTATCGATCGCAATAATAAACCGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAACACTTAATCTGATCGGTAAAAAAACAGATATTGAAAAACAGATGTATGGTAAGTTTTTAAAATATAAAACTGATATTGATAATGATTCTCTAATGAAAGCCAGAGGTGATAAACCAGAAGCGGTGACCTGGGGCTAA
|
||||||
|
Nuc. Counts: [440, 312, 362, 380]
|
||||||
|
Total Mass%: [30.43, 17.74, 28.0, 24.33] of 195417.1
|
||||||
|
Codons List: [ATG, CAG, AAA, ACG, TTA, ATG, GCC, AGT, TTG, ATC, GGC, CTT, GCA, GTT, TGC, ACA, GGG, AAT, GCT, TTT, AGT, CCT, GCC, TTA, GCC, GCA, GAG, GCT, AAA, CAA, CCT, AAT, TTA, GTC, ATT, ATT, ATG, GCG, GAT, GAT, TTA, GGT, TAT, GGC, GAT, TTA, GCA, ACA, TAT, GGT, CAT, CAG, ATC, GTT, AAA, ACA, CCT, AAT, ATC, GAC, AGG, CTT, GCC, CAG, GAA, GGG, GTC, AAA, TTT, ACT, GAC, TAC, TAT, GCC, CCC, GCT, CCT, TTA, AGT, TCA, CCT, TCA, CGC, GCA, GGG, CTA, TTA, ACC, GGC, CGG, ATG, CCA, TTT, CGT, ACT, GGA, ATT, CGC, TCA, TGG, ATT, CCT, TCA, GGC, AAA, GAT, GTT, GCC, TTA, GGG, CGT, AAC, GAA, CTC, ACG, ATT, GCT, AAT, CTA, CTC, AAA, GCG, CAA, GGG, TAC, GAC, ACG, GCA, ATG, ATG, GGT, AAG, CTG, CAT, CTG, AAT, GCA, GGC, GGC, GAT, CGC, ACC, GAT, CAG, CCA, CAA, GCA, CAA, GAT, ATG, GGC, TTT, GAT, TAC, TCA, CTG, GTT, AAT, ACG, GCG, GGC, TTT, GTT, ACC, GAC, GCC, ACG, CTG, GAT, AAC, GCT, AAA, GAA, CGC, CCG, CGT, TAT, GGC, ATG, GTT, TAC, CCG, ACA, GGC, TGG, CTA, CGT, AAC, GGG, CAA, CCC, ACT, CCA, CGA, GCT, GAT, AAA, ATG, AGC, GGT, GAG, TAT, GTC, AGT, TCG, GAA, GTC, GTC, AAC, TGG, CTG, GAT, AAC, AAA, AAG, GAC, AGC, AAG, CCT, TTC, TTC, CTC, TAT, GTT, GCT, TTT, ACC, GAA, GTG, CAT, AGC, CCC, CTG, GCT, TCG, CCC, AAA, AAA, TAC, CTC, GAT, ATG, TAC, TCA, CAA, TAT, ATG, AGC, GCG, TAT, CAG, AAG, CAG, CAT, CCT, GAT, TTA, TTT, TAT, GGC, GAC, TGG, GCA, GAC, AAA, CCC, TGG, CGT, GGT, GTG, GGG, GAA, TAT, TAT, GCC, AAT, ATC, AGC, TAT, CTG, GAT, GCA, CAG, GTT, GGA, AAA, GTG, CTG, GAT, AAA, ATC, AAA, GCT, GTG, GGT, GAA, GAA, GAT, AAC, ACA, ATC, GTT, ATT, TTT, ACC, AGT, GAT, AAC, GGT, CCG, GTA, ACG, CGT, GAA, GCG, CGC, AAA, GTG, TAT, GAG, CTG, AAT, TTG, GCA, GGG, GAA, ACG, GAT, GGA, TTA, CGC, GGT, CGC, AAG, GAT, AAC, CTT, TGG, GAA, GGC, GGA, ATT, CGT, GTT, CCA, GCC, ATT, ATT, AAA, TAT, GGT, AAA, CAT, CTA, CCA, CAG, GGA, ATG, GTT, TCA, GAT, ACA, CCC, GTT, TAT, GGT, CTG, GAC, TGG, ATG, CCT, ACT, TTA, GCG, AAA, ATG, ATG, AAC, TTC, AAA, TTA, CCT, ACA, GAC, CGT, ACT, TTC, GAT, GGT, GAA, TCG, CTG, GTT, CCT, GTT, CTT, GAG, 
CAA, AAA, GCA, TTG, AAA, CGC, GAA, AAG, CCA, TTA, ATT, TTC, GGG, ATT, GAT, ATG, CCA, TTC, CAG, GAT, GAT, CCA, ACC, GAT, GAA, TGG, GCG, ATC, CGT, GAT, GGT, GAC, TGG, AAG, ATG, ATT, ATC, GAT, CGC, AAT, AAT, AAA, CCG, AAA, TAT, CTC, TAC, AAT, CTG, AAA, TCT, GAT, CGT, TAT, GAA, ACA, CTT, AAT, CTG, ATC, GGT, AAA, AAA, ACA, GAT, ATT, GAA, AAA, CAG, ATG, TAT, GGT, AAG, TTT, TTA, AAA, TAT, AAA, ACT, GAT, ATT, GAT, AAT, GAT, TCT, CTA, ATG, AAA, GCC, AGA, GGT, GAT, AAA, CCA, GAA, GCG, GTG, ACC, TGG, GGC, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: putative cytoplasmic protein
|
||||||
|
Nucleotides: ATGTTTACCAACGTAAATGTTGATTGTTGCAAAACACCAGGATGTAAAAACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCACAGGGTAAAAATATTTTATGCCGTGAATGTGGTTACTTGTTTCCAGTGATATCTGAACAGTCGCTTAATATTTATCGTAATATTGTGAATCACTCCTGGAGAGGTTTGATTTGCCAATGTTCAACTTGCGGAGGCACGTCCCTCAAAAAATATGGATATTCTGCACAAGGCCAGAGAAGAATGTATTGCCATCATTGTGAGAAAACATTTATCACTCTGGAACATGTAATTACCACACCACGAGGAGCCCTGTTAGCATTGATGATTGAGCAAGGGGAGGCACTTGCGGATATCAGAAAGTCATTACGTCTTAACAGCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGCAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGTACCCGCGCTTTTCGCGTCAAGTATAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGCGGCAGGGTGGTTGCCATCTCAACCAATTACTCCCCATCTGCCGTAGAGCAACATTATCAATACACATCGAACTATGAAGAGCGTATGTCTCCAGGGACGCTGGCACATCATGTCCAGCGCAAAGAGTTACTTACTATGCGGCGGGATACCTTGTTTGATATTGATTACGGCCCGGCAGTTTTACATCAAAACGATCCGGGAATGTTGGTAAAACCGGTTCTTCCGGCATATCGTCATTTTGAACTGGTCAGAATACTGACCGATGAGCATTCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATATTGGGCGGCTGCCTGATGGCTAATTTGCAGCATATTCATCAAGGTCGCTGCCATATTTCCTTTGTCAAAGAGCGCGGTGTGGCACCCGCCACCATTGATTTTCCACCGCGATTATTCCTTAGTGGTGGGGTACGAAATAATGTCTGGCGTGCATTTTCTAACCGCAATTATTCAATGGCTGTATGCAATCTCACTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATTGAACAGTGCGACGCGTTTTATCCACTTTGTGGAGAACCATCCTTTCCTTATATCATTGAACCGAATGTCTCCTGCGAATGTCGTTTCTACATTAGATATCCTCAAACATCTGTGGAATAAAAAACTAGAGCATGGAACAATTTAA
|
||||||
|
Nuc. Counts: [355, 273, 276, 356]
|
||||||
|
Total Mass%: [29.36, 18.56, 25.53, 27.26] of 163388.6
|
||||||
|
Codons List: [ATG, TTT, ACC, AAC, GTA, AAT, GTT, GAT, TGT, TGC, AAA, ACA, CCA, GGA, TGT, AAA, AAC, CTG, GGG, TTG, CTG, AAT, AGC, CAG, GAT, TAT, GTC, GCA, CAG, GGT, AAA, AAT, ATT, TTA, TGC, CGT, GAA, TGT, GGT, TAC, TTG, TTT, CCA, GTG, ATA, TCT, GAA, CAG, TCG, CTT, AAT, ATT, TAT, CGT, AAT, ATT, GTG, AAT, CAC, TCC, TGG, AGA, GGT, TTG, ATT, TGC, CAA, TGT, TCA, ACT, TGC, GGA, GGC, ACG, TCC, CTC, AAA, AAA, TAT, GGA, TAT, TCT, GCA, CAA, GGC, CAG, AGA, AGA, ATG, TAT, TGC, CAT, CAT, TGT, GAG, AAA, ACA, TTT, ATC, ACT, CTG, GAA, CAT, GTA, ATT, ACC, ACA, CCA, CGA, GGA, GCC, CTG, TTA, GCA, TTG, ATG, ATT, GAG, CAA, GGG, GAG, GCA, CTT, GCG, GAT, ATC, AGA, AAG, TCA, TTA, CGT, CTT, AAC, AGC, ACT, GGA, CTT, AGC, CGT, GAA, CTG, TTA, AAA, TTA, GCG, CGT, GAA, GCA, AAC, TAT, AAA, GAA, AGT, CGA, CAG, TGT, TTC, CCT, GCT, TCT, GAT, ATT, ACC, CTG, AGT, ACC, CGC, GCT, TTT, CGC, GTC, AAG, TAT, AAT, GGT, AGC, AAT, AAC, TCT, CTT, TAT, GCT, CTT, GTT, ACC, GCA, GAA, GAA, CAA, AGC, GGC, AGG, GTG, GTT, GCC, ATC, TCA, ACC, AAT, TAC, TCC, CCA, TCT, GCC, GTA, GAG, CAA, CAT, TAT, CAA, TAC, ACA, TCG, AAC, TAT, GAA, GAG, CGT, ATG, TCT, CCA, GGG, ACG, CTG, GCA, CAT, CAT, GTC, CAG, CGC, AAA, GAG, TTA, CTT, ACT, ATG, CGG, CGG, GAT, ACC, TTG, TTT, GAT, ATT, GAT, TAC, GGC, CCG, GCA, GTT, TTA, CAT, CAA, AAC, GAT, CCG, GGA, ATG, TTG, GTA, AAA, CCG, GTT, CTT, CCG, GCA, TAT, CGT, CAT, TTT, GAA, CTG, GTC, AGA, ATA, CTG, ACC, GAT, GAG, CAT, TCC, AAC, AAC, GTT, CAG, CAT, TAC, CTT, GAT, CAC, GAA, TGC, TTT, ATA, TTG, GGC, GGC, TGC, CTG, ATG, GCT, AAT, TTG, CAG, CAT, ATT, CAT, CAA, GGT, CGC, TGC, CAT, ATT, TCC, TTT, GTC, AAA, GAG, CGC, GGT, GTG, GCA, CCC, GCC, ACC, ATT, GAT, TTT, CCA, CCG, CGA, TTA, TTC, CTT, AGT, GGT, GGG, GTA, CGA, AAT, AAT, GTC, TGG, CGT, GCA, TTT, TCT, AAC, CGC, AAT, TAT, TCA, ATG, GCT, GTA, TGC, AAT, CTC, ACT, GGC, AGT, AAG, AAA, GTC, CGC, GAG, ATG, CGG, CAT, GCA, ACA, TTG, AAC, AGT, GCG, ACG, CGT, TTT, ATC, CAC, TTT, GTG, GAG, AAC, CAT, CCT, TTC, CTT, ATA, TCA, TTG, AAC, CGA, ATG, TCT, CCT, GCG, 
AAT, GTC, GTT, TCT, ACA, TTA, GAT, ATC, CTC, AAA, CAT, CTG, TGG, AAT, AAA, AAA, CTA, GAG, CAT, GGA, ACA, ATT, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: sodium/proton antiporter 1
|
||||||
|
Nucleotides: GTGAAACATCTGCATCGATTCTTTAGCAGTGATGCCTCGGGAGGCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTGCAACCAGTGGATGGTATCACGACTTTCTTGAGACGCCGGTTCAGCTCCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGACGCTCTGATGGCGGTATTTTTCCTGTTGGTTGGTCTGGAAGTTAAACGCGAGCTGATGCAAGGTTCGCTGGCCAGTCTGCGCCAGGCGGCATTTCCTGTTATTGCCGCAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTTTTAACTATGCCGATCCGATTACCCGCGAAGGCTGGGCAATCCCGGCGGCGACTGACATTGCCTTTGCACTTGGTGTGTTGGCGCTGTTGGGAAGTCGTGTTCCGTTAGCGCTGAAGATCTTTTTGATGGCTCTGGCTATTATCGACGATCTTGGGGCCATCATTATCATCGCATTGTTCTACACTAATGACTTATCGATGGCCTCTCTTGGCGTCGCGGCTGTAGCAATTGCGGTACTCGCGGTATTGAATCTGTGTGGTGTACGCCGCACGGGCGTTTATATTCTGGTTGGCGTGGTGCTGTGGACAGCGGTGTTGAAATCGGGGGTTCACGCAACCCTGGCTGGCGTCATTGTCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGGCGCTCTCCGGCTAAACGTCTGGAGCATGTTTTGCATCCATGGGTGGCGTATCTGATTTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAAGGTGTCACGCTGGAAGGTTTGACCTCCATTCTGCCATTAGGGATCATCGCTGGTTTGCTGATTGGCAAGCCACTGGGTATTAGTCTGTTCTGCTGGTTGGCGCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACGACTTACCAGCAAATTATGGCGGTTGGTATCCTGTGCGGTATCGGTTTTACTATGTCTATCTTTATTGCCAGCCTGGCATTTGGTAGCGTAGATCCAGAACTGATTAACTGGGCAAAATTAGGTATCCTTGTCGGTTCAATTTCTTCGGCGGTAATTGGATATAGCTGGTTACGCGTTCGTTTACGTCCATCAGTTTGA
|
||||||
|
Nuc. Counts: [215, 258, 331, 363]
|
||||||
|
Total Mass%: [19.15, 18.9, 32.98, 29.94] of 151683.9
|
||||||
|
Codons List: [GTG, AAA, CAT, CTG, CAT, CGA, TTC, TTT, AGC, AGT, GAT, GCC, TCG, GGA, GGC, ATT, ATT, CTC, ATT, ATT, GCC, GCT, GTA, TTA, GCG, ATG, ATT, ATG, GCC, AAC, AGC, GGT, GCA, ACC, AGT, GGA, TGG, TAT, CAC, GAC, TTT, CTT, GAG, ACG, CCG, GTT, CAG, CTC, CGG, GTT, GGG, ACA, CTT, GAG, ATC, AAC, AAG, AAC, ATG, CTG, CTA, TGG, ATC, AAT, GAC, GCT, CTG, ATG, GCG, GTA, TTT, TTC, CTG, TTG, GTT, GGT, CTG, GAA, GTT, AAA, CGC, GAG, CTG, ATG, CAA, GGT, TCG, CTG, GCC, AGT, CTG, CGC, CAG, GCG, GCA, TTT, CCT, GTT, ATT, GCC, GCA, ATC, GGC, GGG, ATG, ATT, GTC, CCG, GCA, TTG, CTC, TAT, CTG, GCT, TTT, AAC, TAT, GCC, GAT, CCG, ATT, ACC, CGC, GAA, GGC, TGG, GCA, ATC, CCG, GCG, GCG, ACT, GAC, ATT, GCC, TTT, GCA, CTT, GGT, GTG, TTG, GCG, CTG, TTG, GGA, AGT, CGT, GTT, CCG, TTA, GCG, CTG, AAG, ATC, TTT, TTG, ATG, GCT, CTG, GCT, ATT, ATC, GAC, GAT, CTT, GGG, GCC, ATC, ATT, ATC, ATC, GCA, TTG, TTC, TAC, ACT, AAT, GAC, TTA, TCG, ATG, GCC, TCT, CTT, GGC, GTC, GCG, GCT, GTA, GCA, ATT, GCG, GTA, CTC, GCG, GTA, TTG, AAT, CTG, TGT, GGT, GTA, CGC, CGC, ACG, GGC, GTT, TAT, ATT, CTG, GTT, GGC, GTG, GTG, CTG, TGG, ACA, GCG, GTG, TTG, AAA, TCG, GGG, GTT, CAC, GCA, ACC, CTG, GCT, GGC, GTC, ATT, GTC, GGC, TTC, TTT, ATT, CCT, TTG, AAA, GAG, AAG, CAT, GGG, CGC, TCT, CCG, GCT, AAA, CGT, CTG, GAG, CAT, GTT, TTG, CAT, CCA, TGG, GTG, GCG, TAT, CTG, ATT, TTG, CCG, CTG, TTT, GCA, TTT, GCT, AAT, GCT, GGC, GTT, TCA, CTG, CAA, GGT, GTC, ACG, CTG, GAA, GGT, TTG, ACC, TCC, ATT, CTG, CCA, TTA, GGG, ATC, ATC, GCT, GGT, TTG, CTG, ATT, GGC, AAG, CCA, CTG, GGT, ATT, AGT, CTG, TTC, TGC, TGG, TTG, GCG, CTG, CGT, TTG, AAA, TTG, GCA, CAT, CTG, CCA, GAG, GGA, ACG, ACT, TAC, CAG, CAA, ATT, ATG, GCG, GTT, GGT, ATC, CTG, TGC, GGT, ATC, GGT, TTT, ACT, ATG, TCT, ATC, TTT, ATT, GCC, AGC, CTG, GCA, TTT, GGT, AGC, GTA, GAT, CCA, GAA, CTG, ATT, AAC, TGG, GCA, AAA, TTA, GGT, ATC, CTT, GTC, GGT, TCA, ATT, TCT, TCG, GCG, GTA, ATT, GGA, TAT, AGC, TGG, TTA, CGC, GTT, CGT, TTA, CGT, CCA, TCA, GTT, TGA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: transcriptional activator protein NhaR
|
||||||
|
Nucleotides: ATGAGCATGTCTCATATCAATTACAACCACTTGTATTACTTCTGGCATGTCTACAAAGAAGGTTCTGTGGTTGGCGCAGCGGAGGCGCTTTATTTAACACCACAAACCATTACCGGGCAGATCCGGGCGCTGGAAGAGCGCCTGCAAGGGAAACTATTTAAGCGTAAAGGACGTGGTCTGGAACCCAGCGAACTGGGGGAACTGGTCTATCGCTATGCCGATAAAATGTTCACCTTAAGCCAGGAAATGCTGGATATCGTCAACTATCGCAAAGAGTCCAACTTATTGTTTGATGTTGGTGTGGCAGATGCACTTTCCAAACGTCTGGTCAGCAGTGTTCTGGATGCCGCAGTTGTGGAAGACGAGCAGATCCATCTACGCTGTTTCGAATCGACGCACGAGATGCTTTTAGAGCAGTTGAGTCAGCATAAACTGGATATGATCATCTCTGACTGTCCGATCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAATTGGCGAATGTGGTGTCAGTTTCTGGTGCACTAACCCACTACCAGAAAAGCCGTTTCCTGCCTGTCTTGAAGAGCGTCGTTTACTTATTCCGGGGCGTCGCTCAATGTTGGGGCGTAAACTATTAAACTGGTTTAACTCCCAGGGCTTGAACGTCGAAATTTTGGGTGAGTTTGATGATGCTGCGTTGATGAAAGCCTTTGGGGCGACGCATAACGCTATTTTCGTTGCACCTTCGCTTTACGCTAATGATTTCTATAACGATGACTCGGTTGTGGAGATAGGCCGTGTTGAGAACGTGATGGAAGAGTACCACGCGATTTTTGCCGAAAGGATGATTCAGCACCCTGCAGTACAGCGTATCTGCAATACAGACTATTCTGCGCTGTTTACTCCAGCTTCAAAATAA
|
||||||
|
Nuc. Counts: [228, 197, 232, 249]
|
||||||
|
Total Mass%: [26.07, 18.52, 29.67, 26.36] of 118181.6
|
||||||
|
Codons List: [ATG, AGC, ATG, TCT, CAT, ATC, AAT, TAC, AAC, CAC, TTG, TAT, TAC, TTC, TGG, CAT, GTC, TAC, AAA, GAA, GGT, TCT, GTG, GTT, GGC, GCA, GCG, GAG, GCG, CTT, TAT, TTA, ACA, CCA, CAA, ACC, ATT, ACC, GGG, CAG, ATC, CGG, GCG, CTG, GAA, GAG, CGC, CTG, CAA, GGG, AAA, CTA, TTT, AAG, CGT, AAA, GGA, CGT, GGT, CTG, GAA, CCC, AGC, GAA, CTG, GGG, GAA, CTG, GTC, TAT, CGC, TAT, GCC, GAT, AAA, ATG, TTC, ACC, TTA, AGC, CAG, GAA, ATG, CTG, GAT, ATC, GTC, AAC, TAT, CGC, AAA, GAG, TCC, AAC, TTA, TTG, TTT, GAT, GTT, GGT, GTG, GCA, GAT, GCA, CTT, TCC, AAA, CGT, CTG, GTC, AGC, AGT, GTT, CTG, GAT, GCC, GCA, GTT, GTG, GAA, GAC, GAG, CAG, ATC, CAT, CTA, CGC, TGT, TTC, GAA, TCG, ACG, CAC, GAG, ATG, CTT, TTA, GAG, CAG, TTG, AGT, CAG, CAT, AAA, CTG, GAT, ATG, ATC, ATC, TCT, GAC, TGT, CCG, ATC, GAT, TCC, ACT, CAG, CAG, GAA, GGG, CTG, TTT, TCC, ATG, AAA, ATT, GGC, GAA, TGT, GGT, GTC, AGT, TTC, TGG, TGC, ACT, AAC, CCA, CTA, CCA, GAA, AAG, CCG, TTT, CCT, GCC, TGT, CTT, GAA, GAG, CGT, CGT, TTA, CTT, ATT, CCG, GGG, CGT, CGC, TCA, ATG, TTG, GGG, CGT, AAA, CTA, TTA, AAC, TGG, TTT, AAC, TCC, CAG, GGC, TTG, AAC, GTC, GAA, ATT, TTG, GGT, GAG, TTT, GAT, GAT, GCT, GCG, TTG, ATG, AAA, GCC, TTT, GGG, GCG, ACG, CAT, AAC, GCT, ATT, TTC, GTT, GCA, CCT, TCG, CTT, TAC, GCT, AAT, GAT, TTC, TAT, AAC, GAT, GAC, TCG, GTT, GTG, GAG, ATA, GGC, CGT, GTT, GAG, AAC, GTG, ATG, GAA, GAG, TAC, CAC, GCG, ATT, TTT, GCC, GAA, AGG, ATG, ATT, CAG, CAC, CCT, GCA, GTA, CAG, CGT, ATC, TGC, AAT, ACA, GAC, TAT, TCT, GCG, CTG, TTT, ACT, CCA, GCT, TCA, AAA, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: riboflavin kinase
|
||||||
|
Nucleotides: ATGAAGCTGATACGCGGCATACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTAATTTCGACGGCGTGCATCGCGGTCATCGCGCGCTGTTACAGGGCTTGCAGGAAGAAGGGCGCAAGCGCAACTTACCGGTGATGGTGATGCTTTTTGAACCTCAACCACTGGAACTGTTTGCTACTGATAAAGCCCCGGCACGGCTCACCCGGCTGCGGGAAAAACTGCGTTATCTTGCAGAGTGTGGCGTTGATTACGTGCTGTGCGTGCGTTTTGACAGGCGTTTTGCGGCGTTAACCGCGCAAAACTTCATCAGTGATCTTCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGATTTCCGCTTTGGCGCTGGTCGTGAAGGCGATTTCTTGTTATTACAGAAAGCGGGCATGGAATACGGCTTCGATATCACCAGCACGCAAACTTTTTGCGAAGGTGGTGTGCGTATCAGCAGCACCGCCGTGCGTCAGGCGCTTGCGGATGACAATCTGGCTCTGGCAGAAAGTTTACTGGGGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGAATTAGGGCGCACTATAGGTTTCCCGACGGCGAATGTACCGCTACGCCGTCAGGTTTCCCCGGTGAAAGGGGTTTATGCGGTAGAAGTGTTGGGCCTTGGCGAAAAGCCGTTACCCGGCGTTGCAAACATCGGAACACGCCCAACGGTTGCCGGTATTCGCCAGCAACTGGAAGTGCATTTGTTAGATGTTGCAATGGACCTTTATGGTCGCCATATACAAGTAGTGCTGCGTAAAAAAATACGCAATGAGCAGCGATTTGCATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGCCCGCGAATTTTTTGGGCTAACAAAACCGGCTTAA
|
||||||
|
Nuc. Counts: [213, 221, 276, 232]
|
||||||
|
Total Mass%: [23.23, 19.81, 33.66, 23.42] of 123918.1
|
||||||
|
Codons List: [ATG, AAG, CTG, ATA, CGC, GGC, ATA, CAT, AAT, CTC, AGC, CAG, GCC, CCG, CAA, GAA, GGG, TGT, GTG, CTG, ACT, ATT, GGT, AAT, TTC, GAC, GGC, GTG, CAT, CGC, GGT, CAT, CGC, GCG, CTG, TTA, CAG, GGC, TTG, CAG, GAA, GAA, GGG, CGC, AAG, CGC, AAC, TTA, CCG, GTG, ATG, GTG, ATG, CTT, TTT, GAA, CCT, CAA, CCA, CTG, GAA, CTG, TTT, GCT, ACT, GAT, AAA, GCC, CCG, GCA, CGG, CTC, ACC, CGG, CTG, CGG, GAA, AAA, CTG, CGT, TAT, CTT, GCA, GAG, TGT, GGC, GTT, GAT, TAC, GTG, CTG, TGC, GTG, CGT, TTT, GAC, AGG, CGT, TTT, GCG, GCG, TTA, ACC, GCG, CAA, AAC, TTC, ATC, AGT, GAT, CTT, CTG, GTG, AAG, CAC, TTG, CGG, GTA, AAA, TTT, CTT, GCC, GTA, GGT, GAC, GAT, TTC, CGC, TTT, GGC, GCT, GGT, CGT, GAA, GGC, GAT, TTC, TTG, TTA, TTA, CAG, AAA, GCG, GGC, ATG, GAA, TAC, GGC, TTC, GAT, ATC, ACC, AGC, ACG, CAA, ACT, TTT, TGC, GAA, GGT, GGT, GTG, CGT, ATC, AGC, AGC, ACC, GCC, GTG, CGT, CAG, GCG, CTT, GCG, GAT, GAC, AAT, CTG, GCT, CTG, GCA, GAA, AGT, TTA, CTG, GGG, CAC, CCG, TTT, GCT, ATC, TCC, GGG, CGT, GTA, GTC, CAC, GGT, GAT, GAA, TTA, GGG, CGC, ACT, ATA, GGT, TTC, CCG, ACG, GCG, AAT, GTA, CCG, CTA, CGC, CGT, CAG, GTT, TCC, CCG, GTG, AAA, GGG, GTT, TAT, GCG, GTA, GAA, GTG, TTG, GGC, CTT, GGC, GAA, AAG, CCG, TTA, CCC, GGC, GTT, GCA, AAC, ATC, GGA, ACA, CGC, CCA, ACG, GTT, GCC, GGT, ATT, CGC, CAG, CAA, CTG, GAA, GTG, CAT, TTG, TTA, GAT, GTT, GCA, ATG, GAC, CTT, TAT, GGT, CGC, CAT, ATA, CAA, GTA, GTG, CTG, CGT, AAA, AAA, ATA, CGC, AAT, GAG, CAG, CGA, TTT, GCA, TCG, CTG, GAC, GAA, CTG, AAA, GCG, CAG, ATT, GCG, CGT, GAT, GAA, TTA, ACC, GCC, CGC, GAA, TTT, TTT, GGG, CTA, ACA, AAA, CCG, GCT, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: Isoleucyl-tRNA synthetase
|
||||||
|
Nucleotides: ATGAGTGACTATAAATCAACCCTGAATTTGCCGGAAACAGGGTTCCCGATGCGTGGCGATCTCGCCAAGCGCGAACCGGGAATGCTGGCGCGTTGGACTGATGATGATCTGTACGGCATCATCCGTGCGGCTAAAAAAGGCAAAAAAACCTTCATTCTGCATGATGGCCCTCCTTATGCGAATGGCAGCATTCATATTGGTCACTCGGTTAACAAGATTCTGAAAGACATTATCATTAAGTCCAAAGGGCTTTCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCATGGTCTGCCAATCGAACTGAAAGTAGAGCAAGAATACGGTAAGCCGGGGGAGAAATTCACCGCCGCTGAGTTCCGCGCCAAGTGCCGCGAATACGCTGCGACCCAGGTTGACGGTCAGCGCAAAGACTTTATCCGTCTGGGCGTGCTGGGCGACTGGTCGCACCCGTACCTGACCATGGACTTCAAAACTGAAGCCAACATCATCCGCGCGCTGGGCAAAATCATCGGCAACGGTCACCTGCACAAAGGCGCGAAGCCGGTGCACTGGTGCGTTGACTGCCGTTCTGCACTGGCAGAAGCGGAAGTTGAGTATTACGACAAAACTTCTCCGTCCATCGACGTCGCTTTCCAGGCGGTCGATCAGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATGTTAACGGCCCAATTTCGCTGGTTATCTGGACCACCACGCCGTGGACGCTGCCTGCTAACCGCGCAATCTCCATTGCACCTGATTTTGATTATGCGCTGGTGCAAATCGACGGTCAGGCCGTGATCCTCGCGAAAGATCTGGTTGAAAGCGTAATGCAGCGTATCGGCGTTAGCGATTACACCATTCTTGGCACGGTGAAAGGTGCCGAGCTGGAACTGTTGCGCTTTACCCATCCGTTTATGGACTTCGATGTTCCGGCAATTCTCGGCGACCACGTTACGCTGGATGCCGGTACCGGTGCCGTTCATACCGCGCCAGGCCACGGTCCGGACGACTATGTGATCGGTCAAAAATATGGTCTGGAAACCGCTAACCCGGTTGGCCCGGACGGCACTTATCTGCCGGGTACTTACCCGACTCTGGATGGCGTTAACGTCTTCAAAGCGAACGATATTGTCATTGCGTTGTTGCAGGAAAAAGGCGCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTGCTGCTGGCGTCATAAAACGCCGATCATCTTCCGCGCGACGCCGCAGTGGTTCGTCAGCATGGATCAGAAAGGTCTGCGTGCGCAGTCACTGAAAGAGATCAAAGGCGTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATCTCTCGTCAGCGTACCTGGGGCGTGCCGATGTCACTGTTCGTGCACAAAGACACAGAAGAACTGCATCCGCGTACTCTCGAACTGATGGAAGAAGTGGCAAAACGCGTTGAAGTTGACGGCATTCAGGCGTGGTGGGATCTCGATGCGAAAGAGATCCTCGGCGACGAAGCTGACCAGTATGTGAAAGTACCGGATACGCTGGATGTATGGTTTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTCCGGAATTTGCCGGTCACGCAGCGGACATGTATCTGGAAGGTTCTGACCAACACCGTGGCTGGTTCATGTCTTCCCTGATGATCTCTACCGCGATGAAGGGCAAAGCGCCATATCGTCAGGTACTGACTCACGGCTTTACCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGTAACACCGTTTCGCCGCAGGATGTGATGAATAAACTGGGTGCGGATATTCTGCGTCTGTGGGTGGCATCAACCGACTACACTGGCGAAATGGCCGTTTCTGACGAGATCCTGAAACGTGCTGCCGACAGCTATCGTCGTATCCGTAACACCGCGCGCTTCCTGC
TGGCAAACCTGAACGGTTTTGATCCGGCAAAAGATATGGTGAAACCGGAAGAGATGGTGGTACTGGATCGCTGGGCCGTAGGTTGTGCGAAAGCGGCACAGGAAGACATCCTCAAGGCGTACGAAGCATACGATTTCCACGAAGTGGTACAGCGTCTGATGCGCTTCTGCTCCGTTGAGATGGGTTCCTTCTACCTCGACATCATCAAAGACCGTCAGTATACCGCCAAAGCGGACAGCGTGGCGCGTCGTAGCTGCCAGACTGCGCTGTATCACATCGCAGAAGCGCTGGTTCGCTGGATGGCACCAATCCTCTCCTTCACCGCTGATGAAGTGTGGGGTTACCTGCCGGGCGAACGTGAAAAATACGTCTTCACCGGCGAGTGGTACGAAGGCCTGTTTGGTCTGGCAGACAGTGAAGCAATGAACGATGCGTTCTGGGACGAGCTGTTGAAAGTGCGTGGCGAAGTGAACAAAGTCATTGAGCAAGCGCGTGCCGATAAGAACGTGGGCGGCTCGCTGGAAGCGGCAGTAACCTTGTATGCAGAACCGGAACTGGCGGCGAAACTGACCGCGCTGGGCGATGAATTACGATTTGTCCTGTTGACCTCCGGCGCTACCGTTGCAGACTATAACGACGCACCTGCTGATGCCCAGCAGAGCGAAGTCCTCAAAGGGCTGAAAGTCGCGTTGAGTAAAGCCGAAGGTGAGAAGTGTCCTCGCTGCTGGCACTACACCCAGGATGTCGGCAAGGTGGCGGAACACGCAGAAATCTGCGGCCGCTGTGTCAGCAACGTCGCCGGTGACGGTGAAAAACGTAAGTTTGCCTGA
|
||||||
|
Nuc. Counts: [660, 720, 817, 620]
|
||||||
|
Total Mass%: [24.0, 21.53, 33.23, 20.87] of 371617.0
|
||||||
|
Codons List: [ATG, AGT, GAC, TAT, AAA, TCA, ACC, CTG, AAT, TTG, CCG, GAA, ACA, GGG, TTC, CCG, ATG, CGT, GGC, GAT, CTC, GCC, AAG, CGC, GAA, CCG, GGA, ATG, CTG, GCG, CGT, TGG, ACT, GAT, GAT, GAT, CTG, TAC, GGC, ATC, ATC, CGT, GCG, GCT, AAA, AAA, GGC, AAA, AAA, ACC, TTC, ATT, CTG, CAT, GAT, GGC, CCT, CCT, TAT, GCG, AAT, GGC, AGC, ATT, CAT, ATT, GGT, CAC, TCG, GTT, AAC, AAG, ATT, CTG, AAA, GAC, ATT, ATC, ATT, AAG, TCC, AAA, GGG, CTT, TCT, GGA, TAT, GAC, TCG, CCG, TAT, GTG, CCT, GGC, TGG, GAC, TGT, CAT, GGT, CTG, CCA, ATC, GAA, CTG, AAA, GTA, GAG, CAA, GAA, TAC, GGT, AAG, CCG, GGG, GAG, AAA, TTC, ACC, GCC, GCT, GAG, TTC, CGC, GCC, AAG, TGC, CGC, GAA, TAC, GCT, GCG, ACC, CAG, GTT, GAC, GGT, CAG, CGC, AAA, GAC, TTT, ATC, CGT, CTG, GGC, GTG, CTG, GGC, GAC, TGG, TCG, CAC, CCG, TAC, CTG, ACC, ATG, GAC, TTC, AAA, ACT, GAA, GCC, AAC, ATC, ATC, CGC, GCG, CTG, GGC, AAA, ATC, ATC, GGC, AAC, GGT, CAC, CTG, CAC, AAA, GGC, GCG, AAG, CCG, GTG, CAC, TGG, TGC, GTT, GAC, TGC, CGT, TCT, GCA, CTG, GCA, GAA, GCG, GAA, GTT, GAG, TAT, TAC, GAC, AAA, ACT, TCT, CCG, TCC, ATC, GAC, GTC, GCT, TTC, CAG, GCG, GTC, GAT, CAG, GAT, GCG, CTG, AAA, ACG, AAA, TTT, GGC, GTA, AGC, AAT, GTT, AAC, GGC, CCA, ATT, TCG, CTG, GTT, ATC, TGG, ACC, ACC, ACG, CCG, TGG, ACG, CTG, CCT, GCT, AAC, CGC, GCA, ATC, TCC, ATT, GCA, CCT, GAT, TTT, GAT, TAT, GCG, CTG, GTG, CAA, ATC, GAC, GGT, CAG, GCC, GTG, ATC, CTC, GCG, AAA, GAT, CTG, GTT, GAA, AGC, GTA, ATG, CAG, CGT, ATC, GGC, GTT, AGC, GAT, TAC, ACC, ATT, CTT, GGC, ACG, GTG, AAA, GGT, GCC, GAG, CTG, GAA, CTG, TTG, CGC, TTT, ACC, CAT, CCG, TTT, ATG, GAC, TTC, GAT, GTT, CCG, GCA, ATT, CTC, GGC, GAC, CAC, GTT, ACG, CTG, GAT, GCC, GGT, ACC, GGT, GCC, GTT, CAT, ACC, GCG, CCA, GGC, CAC, GGT, CCG, GAC, GAC, TAT, GTG, ATC, GGT, CAA, AAA, TAT, GGT, CTG, GAA, ACC, GCT, AAC, CCG, GTT, GGC, CCG, GAC, GGC, ACT, TAT, CTG, CCG, GGT, ACT, TAC, CCG, ACT, CTG, GAT, GGC, GTT, AAC, GTC, TTC, AAA, GCG, AAC, GAT, ATT, GTC, ATT, GCG, TTG, TTG, CAG, GAA, AAA, GGC, GCA, CTG, TTG, CAC, GTT, GAG, 
AAA, ATG, CAA, CAC, AGC, TAT, CCG, TGC, TGC, TGG, CGT, CAT, AAA, ACG, CCG, ATC, ATC, TTC, CGC, GCG, ACG, CCG, CAG, TGG, TTC, GTC, AGC, ATG, GAT, CAG, AAA, GGT, CTG, CGT, GCG, CAG, TCA, CTG, AAA, GAG, ATC, AAA, GGC, GTG, CAG, TGG, ATC, CCT, GAC, TGG, GGC, CAG, GCG, CGT, ATC, GAG, TCG, ATG, GTT, GCT, AAC, CGT, CCT, GAC, TGG, TGT, ATC, TCT, CGT, CAG, CGT, ACC, TGG, GGC, GTG, CCG, ATG, TCA, CTG, TTC, GTG, CAC, AAA, GAC, ACA, GAA, GAA, CTG, CAT, CCG, CGT, ACT, CTC, GAA, CTG, ATG, GAA, GAA, GTG, GCA, AAA, CGC, GTT, GAA, GTT, GAC, GGC, ATT, CAG, GCG, TGG, TGG, GAT, CTC, GAT, GCG, AAA, GAG, ATC, CTC, GGC, GAC, GAA, GCT, GAC, CAG, TAT, GTG, AAA, GTA, CCG, GAT, ACG, CTG, GAT, GTA, TGG, TTT, GAC, TCC, GGA, TCT, ACC, CAC, TCT, TCC, GTT, GTT, GAT, GTG, CGT, CCG, GAA, TTT, GCC, GGT, CAC, GCA, GCG, GAC, ATG, TAT, CTG, GAA, GGT, TCT, GAC, CAA, CAC, CGT, GGC, TGG, TTC, ATG, TCT, TCC, CTG, ATG, ATC, TCT, ACC, GCG, ATG, AAG, GGC, AAA, GCG, CCA, TAT, CGT, CAG, GTA, CTG, ACT, CAC, GGC, TTT, ACC, GTG, GAT, GGT, CAG, GGT, CGC, AAG, ATG, TCT, AAA, TCC, ATC, GGT, AAC, ACC, GTT, TCG, CCG, CAG, GAT, GTG, ATG, AAT, AAA, CTG, GGT, GCG, GAT, ATT, CTG, CGT, CTG, TGG, GTG, GCA, TCA, ACC, GAC, TAC, ACT, GGC, GAA, ATG, GCC, GTT, TCT, GAC, GAG, ATC, CTG, AAA, CGT, GCT, GCC, GAC, AGC, TAT, CGT, CGT, ATC, CGT, AAC, ACC, GCG, CGC, TTC, CTG, CTG, GCA, AAC, CTG, AAC, GGT, TTT, GAT, CCG, GCA, AAA, GAT, ATG, GTG, AAA, CCG, GAA, GAG, ATG, GTG, GTA, CTG, GAT, CGC, TGG, GCC, GTA, GGT, TGT, GCG, AAA, GCG, GCA, CAG, GAA, GAC, ATC, CTC, AAG, GCG, TAC, GAA, GCA, TAC, GAT, TTC, CAC, GAA, GTG, GTA, CAG, CGT, CTG, ATG, CGC, TTC, TGC, TCC, GTT, GAG, ATG, GGT, TCC, TTC, TAC, CTC, GAC, ATC, ATC, AAA, GAC, CGT, CAG, TAT, ACC, GCC, AAA, GCG, GAC, AGC, GTG, GCG, CGT, CGT, AGC, TGC, CAG, ACT, GCG, CTG, TAT, CAC, ATC, GCA, GAA, GCG, CTG, GTT, CGC, TGG, ATG, GCA, CCA, ATC, CTC, TCC, TTC, ACC, GCT, GAT, GAA, GTG, TGG, GGT, TAC, CTG, CCG, GGC, GAA, CGT, GAA, AAA, TAC, GTC, TTC, ACC, GGC, GAG, TGG, TAC, GAA, GGC, CTG, TTT, GGT, 
CTG, GCA, GAC, AGT, GAA, GCA, ATG, AAC, GAT, GCG, TTC, TGG, GAC, GAG, CTG, TTG, AAA, GTG, CGT, GGC, GAA, GTG, AAC, AAA, GTC, ATT, GAG, CAA, GCG, CGT, GCC, GAT, AAG, AAC, GTG, GGC, GGC, TCG, CTG, GAA, GCG, GCA, GTA, ACC, TTG, TAT, GCA, GAA, CCG, GAA, CTG, GCG, GCG, AAA, CTG, ACC, GCG, CTG, GGC, GAT, GAA, TTA, CGA, TTT, GTC, CTG, TTG, ACC, TCC, GGC, GCT, ACC, GTT, GCA, GAC, TAT, AAC, GAC, GCA, CCT, GCT, GAT, GCC, CAG, CAG, AGC, GAA, GTC, CTC, AAA, GGG, CTG, AAA, GTC, GCG, TTG, AGT, AAA, GCC, GAA, GGT, GAG, AAG, TGT, CCT, CGC, TGC, TGG, CAC, TAC, ACC, CAG, GAT, GTC, GGC, AAG, GTG, GCG, GAA, CAC, GCA, GAA, ATC, TGC, GGC, CGC, TGT, GTC, AGC, AAC, GTC, GCC, GGT, GAC, GGT, GAA, AAA, CGT, AAG, TTT, GCC, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: Non-protein region
|
||||||
|
Nucleotides: GCTTGCGCCAACGCCATTTCATCGCCATCCCGCCGAGCATACAGGCCTCGGAAGAACCAATGGTGTTGGTGCCAACGGCCTGACCATTTTTCGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGCAGATTGCGGATATTCTTCTTTGTCGATCCAGTTTTTGTTAATGGATAAATCCA
|
||||||
|
Nuc. Counts: [46, 56, 49, 53]
|
||||||
|
Total Mass%: [23.44, 23.46, 27.93, 25.01] of 26515.7
|
||||||
|
Codons List: [GCT, TGC, GCC, AAC, GCC, ATT, TCA, TCG, CCA, TCC, CGC, CGA, GCA, TAC, AGG, CCT, CGG, AAG, AAC, CAA, TGG, TGT, TGG, TGC, CAA, CGG, CCT, GAC, CAT, TTT, TCG, GTG, CAG, GCG, CAT, GCC, ACA, GAT, CGG, CAA, CCA, TGT, TTA, CGC, AAC, GCA, GAT, CGA, TTG, CTG, CAG, ATT, GCG, GAT, ATT, CTT, CTT, TGT, CGA, TCC, AGT, TTT, TGT, TAA, TGG, ATA, AAT, CCA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase
|
||||||
|
Nucleotides: ATGTCTGAATCTGTACAGAGCAATAGCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGATGGCACCACCGCTGAGTCTACCCGCAACAACGGTAAACCGGCGCTGTTCCGCCTGGGTGATGCTTCTCTTTCTGAAGGGCTGGAGCAACACCTGCTGGGGCTGAAAGTGGGCGATAAAACCACCTTCTCGCTGGAGCCAGATGCGGCGTTTGGCGTGCCGTCACCGGACCTGATTCAGTACTTCTCCCGCCGTGAATTTATGGATGCAGGCGAGCCAGAAATTGGCGCAATCATGCTTTTTACCGCAATGGATGGCAGTGAGATGCCTGGCGTGATCCGCGAAATTAACGGCGACTCCATTACCGTTGATTTCAACCATCCGCTGGCCGGGCAGACCGTTCATTTTGATATTGAAGTGCTGGAAATCGATCCGGCACTGGAGGCGTAA
|
||||||
|
Nuc. Counts: [100, 121, 125, 104]
|
||||||
|
Total Mass%: [22.87, 22.75, 31.97, 22.02] of 59096.4
|
||||||
|
Codons List: [ATG, TCT, GAA, TCT, GTA, CAG, AGC, AAT, AGC, GCC, GTC, CTG, GTG, CAC, TTC, ACG, CTA, AAA, CTC, GAC, GAT, GGC, ACC, ACC, GCT, GAG, TCT, ACC, CGC, AAC, AAC, GGT, AAA, CCG, GCG, CTG, TTC, CGC, CTG, GGT, GAT, GCT, TCT, CTT, TCT, GAA, GGG, CTG, GAG, CAA, CAC, CTG, CTG, GGG, CTG, AAA, GTG, GGC, GAT, AAA, ACC, ACC, TTC, TCG, CTG, GAG, CCA, GAT, GCG, GCG, TTT, GGC, GTG, CCG, TCA, CCG, GAC, CTG, ATT, CAG, TAC, TTC, TCC, CGC, CGT, GAA, TTT, ATG, GAT, GCA, GGC, GAG, CCA, GAA, ATT, GGC, GCA, ATC, ATG, CTT, TTT, ACC, GCA, ATG, GAT, GGC, AGT, GAG, ATG, CCT, GGC, GTG, ATC, CGC, GAA, ATT, AAC, GGC, GAC, TCC, ATT, ACC, GTT, GAT, TTC, AAC, CAT, CCG, CTG, GCC, GGG, CAG, ACC, GTT, CAT, TTT, GAT, ATT, GAA, GTG, CTG, GAA, ATC, GAT, CCG, GCA, CTG, GAG, GCG, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
|
@ -0,0 +1,18 @@
|
||||||
|
cure for cancer protein
|
||||||
|
ATGCCACTATGGTAG
|
||||||
|
captain picard hair growth protein
|
||||||
|
ATgCCAACATGgATGCCcGATAtGGATTgA
|
||||||
|
bogus protein
|
||||||
|
CCATtAATgATCaCAGTt
|
||||||
|
michael jordan mad hops protein
|
||||||
|
ATgAGATCCgtgatGTGggaTCCTaCTCATTaa
|
||||||
|
paris hilton phony protein
|
||||||
|
AtgCCaacaTGGATGCCCTAAGATAtgGATTagtgA
|
||||||
|
george w bush approval rating protein
|
||||||
|
atgataattagttttaatatcagactgtaa
|
||||||
|
jimi hendrix guitar talent protein
|
||||||
|
ATGCAATTGCTCGATTAG
|
||||||
|
tyler durden's brain protein
|
||||||
|
ATGATAcctatgagtaaTGTGGACCatatccaaACTATAGGCATtgtcggACCAACGATcgattggtTATACTGA
|
||||||
|
mini me growth hormone
|
||||||
|
AtGgGaCGCTgA
|
|
@ -0,0 +1,5 @@
|
||||||
|
This program reports information about DNA
|
||||||
|
nucleotide sequences that may encode proteins.
|
||||||
|
|
||||||
|
Input file name? dna.txt
|
||||||
|
Output file name? dna_file.txt
|
|
@ -0,0 +1,63 @@
|
||||||
|
Region Name: cure for cancer protein
|
||||||
|
Nucleotides: ATGCCACTATGGTAG
|
||||||
|
Nuc. Counts: [4, 3, 4, 4]
|
||||||
|
Total Mass%: [27.3, 16.8, 30.6, 25.3] of 1978.8
|
||||||
|
Codons List: [ATG, CCA, CTA, TGG, TAG]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: captain picard hair growth protein
|
||||||
|
Nucleotides: ATGCCAACATGGATGCCCGATATGGATTGA
|
||||||
|
Nuc. Counts: [9, 6, 8, 7]
|
||||||
|
Total Mass%: [30.7, 16.8, 30.5, 22.1] of 3967.5
|
||||||
|
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, GAT, ATG, GAT, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: bogus protein
|
||||||
|
Nucleotides: CCATTAATGATCACAGTT
|
||||||
|
Nuc. Counts: [6, 4, 2, 6]
|
||||||
|
Total Mass%: [35.1, 19.3, 13.1, 32.5] of 2308.1
|
||||||
|
Codons List: [CCA, TTA, ATG, ATC, ACA, GTT]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: michael jordan mad hops protein
|
||||||
|
Nucleotides: ATGAGATCCGTGATGTGGGATCCTACTCATTAA
|
||||||
|
Nuc. Counts: [9, 6, 8, 10]
|
||||||
|
Total Mass%: [28.0, 15.3, 27.8, 28.8] of 4342.9
|
||||||
|
Codons List: [ATG, AGA, TCC, GTG, ATG, TGG, GAT, CCT, ACT, CAT, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: paris hilton phony protein
|
||||||
|
Nucleotides: ATGCCAACATGGATGCCCTAAGATATGGATTAGTGA
|
||||||
|
Nuc. Counts: [12, 6, 9, 9]
|
||||||
|
Total Mass%: [34.0, 14.0, 28.5, 23.6] of 4774.3
|
||||||
|
Codons List: [ATG, CCA, ACA, TGG, ATG, CCC, TAA, GAT, ATG, GAT, TAG, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: george w bush approval rating protein
|
||||||
|
Nucleotides: ATGATAATTAGTTTTAATATCAGACTGTAA
|
||||||
|
Nuc. Counts: [12, 2, 4, 12]
|
||||||
|
Total Mass%: [41.1, 5.6, 15.3, 38.0] of 3949.5
|
||||||
|
Codons List: [ATG, ATA, ATT, AGT, TTT, AAT, ATC, AGA, CTG, TAA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: jimi hendrix guitar talent protein
|
||||||
|
Nucleotides: ATGCAATTGCTCGATTAG
|
||||||
|
Nuc. Counts: [5, 3, 4, 6]
|
||||||
|
Total Mass%: [28.6, 14.1, 25.6, 31.8] of 2364.1
|
||||||
|
Codons List: [ATG, CAA, TTG, CTC, GAT, TAG]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: tyler durden's brain protein
|
||||||
|
Nucleotides: ATGATACCTATGAGTAATGTGGACCATATCCAAACTATAGGCATTGTCGGACCAACGATCGATTGGTTATACTGA
|
||||||
|
Nuc. Counts: [24, 14, 16, 21]
|
||||||
|
Total Mass%: [32.9, 15.8, 24.6, 26.7] of 9843.8
|
||||||
|
Codons List: [ATG, ATA, CCT, ATG, AGT, AAT, GTG, GAC, CAT, ATC, CAA, ACT, ATA, GGC, ATT, GTC, GGA, CCA, ACG, ATC, GAT, TGG, TTA, TAC, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: mini me growth hormone
|
||||||
|
Nucleotides: ATGGGACGCTGA
|
||||||
|
Nuc. Counts: [3, 2, 5, 2]
|
||||||
|
Total Mass%: [24.8, 13.6, 46.3, 15.3] of 1633.4
|
||||||
|
Codons List: [ATG, GGA, CGC, TGA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
|
@ -0,0 +1,40 @@
|
||||||
|
thr operon leader peptide
|
||||||
|
ATGAAACGCATTAGCaCCAcCATtACCACCaCCATCaCcATTACCACAGGTAACGGTGCGGGCTGA
|
||||||
|
aspartokinase I/homoserine dehydrogenase I
|
||||||
|
ATGCGAGtGTTGAAGTTcgGCGGTaCATCAgTGGCAAATGCAGAACGTtTTCTGCGGgTTGCCGATAttCTGGAAAGcAATGCCAGGCAGGGGCAGgTGGcCACCGTCCTCtCTGcCCCCGCCAAAATCACCAACCATCtGGTaGCGATGATtGaaAAaACCATtAGCGGTCAGGAtGCtTTaCcCaATATCAGCGATGCCGAACGTATTTTTGCCGAACTtCTGACgGGACTCGCCGCcGCCCAGcCGGGATTTCCGCTGGCACAAtTgAAAAcTTTCGTCGACCAgGAATTTGCCCAAATAAAACATGTcCtGCATGGCatCAGTTTGTTGGGGCAGTGCCCGGaTAGCATcAACGCTGCGCTGATTTGcCGTGgCGAGAAAaTGTcGaTcgCCattaTGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGgTCGAAaAAcTGCTgGCAGTGGGTCATTAcCtCgAaTCTACCGTTGATaTtGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCgGCTGACCACATgGtGCTGATGGCTGGTTTCACTGcCggTAATGAAAAAGgCGaGCTGGtGGTtCTGGGAcGCAACGGTTCCGACTaCTCCGCTGCGGTgCTGGCGGCcTGTTTaCGCGCCGATTGTTGcGAgaTCTGGACGGATGTTGAcGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGgAaGCGATGGAGCTTTCTTACTTCGGCGCTAAAgTTCTTCaCCCcCGCACCATTACCCCCATcGCCCAGtTCCAGATcCCTtgCCtGATTAAAAATAcCGgAAAtCCCCAAGCACCAGgTACGCtCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATcTGAATaACATGGCAATgTTCAGcGTTTCCGgCCCGGGGAtGAAAGGgATggTTgGCATGGCGGCGCGcgTCTTTGCAGcGaTGTCACGCGCCCGTaTTtCCGTGGTgCtGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCaAAGCGACTGTGTGCGAGCTgAaCGGGCAaTGcAGGAAGAGtTCTACCTGGAaCTGaAAGAAGGCTTACTGGAGCcGTTGGCgGtGACGGAACGGCTGGCCATTATCTcGGTGgTAGGTGATGGTATGCGcACCTtaCGTGGGAtCTCGgCGAAATtCTtTGCCGCGCTgGCcCGCGCCAATATCAACATTGTCgCCATTGCtCaGGGaTCTTcTGAaCGCTCAAtCTCTGTcGTGGTcAaTAACGATgATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGgCGTCGGTGGCGTTGgcGGTGCGCTGCTGgAGCAACTGAAGCGTCAgCAAAGCTGGTTGAAGAATAAaCATATCGaCTTACGTGTCTGCGGTGTTGCTAACTCGAAGgCACtgCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGgAAGAACTGGCGCAAGCcAAAGAGCCGTTTAATCTCGgGCGcTtAATTCGCCTCGTGAAAGAATATCATCTGCtGAaCCCGGTCATTgTTGACTgTACTTCCAgCCAGGCTGTgGCAGaTCAATATgCCGACTtCCTgCGCGAAGGTTTCCAcGTTGTtACGCCGAaCAAAaAGGCCaACACCTCGTcgATGGaTTACTaCCATCAGTtGCGTTATGCGGCGGAAAAATCGCGGCGTAaATTCCTCtATGACACcaACGTtGGGGCTGGATTACCGGTTATTgAGAACCTGCAAAATCTGCTCAATGCtGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTAtATCTTCGGCAAGTTAGACGAAGGCaTGAGTtTCTCCGAGgCGACCaCACTGGCGCGGGAAATGgGTTATACCGA
ACCGGAcCcGCGAGATGATCTTtCtGGTATGgAtGTGGCGCgTAagCTAtTGATtCTCGCTCGTGAAACGGGACGTGAACTGGAGCtGGCGGATATTGAAATTGAACCTgTGCTGCCCGCaGaGTTTAACGCCGAGGGTGATGTCGCcGCTTTTATGGCGAATCTGTCACAGCTCGACGaTCtCTTTGCCGCGCGTGTgGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATAttGATGAAGATgGCgTCTGCCGCGTGAAGaTTGCCGAAGTGGATGgTAATGaTCCGCTGTTCAAAGTGAaAaATGGCGaAAACGCCCTGGCCTTCTATAGCCACTATtATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCaATgACGTTaCAGCTGCCGGTgTCTTTGCTGATCTGCTACGtACCCTcTCAtGGaAGTTAGGAGTCTGA
|
||||||
|
homoserine kinase
|
||||||
|
ATgGTTAAAgTTTAtGCCCCGGCtTCCAGTGCCaATATGaGcGTCGgGTTTGATGTGCTCGGGgCGGCGGTGACACCTGTTGATGGTGCATTGCTCGgAGaTGTagTcaCGGTTGAGGCGGCAGAGACaTTCAgTCTCAACAACCTCGGACGCTTTGCCGAtAAGCTGCCGTCAGAGCCACGgGaaAATAtCGTTtATcAGTGcTGGGAGCGTtTTTGcCaGGAGCTTGGCAAGCAAATTCCAGTGGCGATGaCTCTGGAAAAGAATatGCCGAtCgGTTCGGGcTTAGGCTcCAGCGCCtGTTCAGTGGTCGCGGCgCTgAtGGCGATgAATGAAcACTGCGGCaAGCCGCTTAATGACACTCGTTTGCTGGCTTtGATGGgCGAgTTGGAAGGGcGTATCTCCGGCAGCAtTCATTACGACAACGtGGCACCGTGtTtTCtTGGTGGTAtGCAGTtgATGATCGAAGAaAACGACATCATCAGCCAGCAaGTGCCAGGGTTTGATGAGtGGCTGTGGGTGCTGGCGTATcCGGgGAtTAAAGTCtCGaCGGcAGAAGCCAGGGCTaTTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCAcGGGCgACATCTgGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATgAAAGaTGTTATCGCTGAACCCTACcGTGaACgGTTaCTGCCAGGCTTCCGGCAGGCGCGGcAGgCGGTTGCGGAAATCGGCGCGGTAgCGAGCGGTATCTCCGGCTCCGGCCCGAcTtTGTTCGCTCTGTGtGAcAAGCCGGATACCGCCCAGCGCGTTGCCGACTGgTTGGGTAAGAACtAcCTGCAAAATCAGgAAGGTTTTGTTcATATTTGCCGGCTGGATACGGCGGGcGCACGAgTACTGGAAAACTAA
|
||||||
|
threonine synthase
|
||||||
|
ATGAAACTCtacaATCTGAAAGATCACAATGAGCAGgTCaGCTTTGCGCAAGCCGTAACCCAGgGgTTAGGCAAAAATCAGGGgCtGTtTTTTCcgCACgaCCTGCCGGaaTTCAGCcTgACTGAAaTTGATGAGATgCTGAAGCtGGATTTTGTCACcCGCAGTGCGAAGATCCTcTCgGCGTTTATTGGTGATGAAATCCCGCAGGAAaTCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAaGCGATGTCGGTtGTCTGGAaTTGTTCcACGGGCcAACGCTGGCaTTTAAAGATTTCGGcGGTcGCTTTATGGCACAAATGCTgACCcATATTGCGGGCGATAAGCCAGTGAcCATTCTGACCGCGACATCCGGTgATACTGGaGCGGCAGTGGcTCATGcTTTCtACGGTtTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTgTTCTGTACATTGgGCggCAATATCGaAACTGTTGCCATCGAcggCGaTTTCGATGCCTGTCAGGCGCTGGTgAAGCAGGCgTTTGATGATGAAGAACTGAAAGTGgCgCtGGGGCtGAATTCTGCTAAcTCCATCAACaTCAGTCGCTTGCTGGCGcAGATTTGTTaTTAcTTTGaGGCTGTCGCACAGTtGCCGCAAGAAGCACGTAACCAGTTGgTTGTCTCGGTaCCGAGTGgAAACtTcGGCGATtTGACGGcGGGTCTGCTGGCGAaGTcACTCGGTCtGCCGGTAAAACGTtTTATTGCtgCGACCAACGTGAACGAtACCGTACCACGTTTCCTGCaCGaCGGTCAGTGGTCAcCCAAaGCGACTCAGgCGAcgTtaTCCAATGCGATGGATGTTAGCCAGCcAAaCAACTGGCCGCGTGTGGAAGAGTTGtTCcGCCGCAAAATCTGGCAACTGAAAGAGCTGGgTTATGCAGCCGTGgATGATGAAACCACGCAACAGACAATGcGTGAGtTAAaAGAACTGGGCTATACCTCGgAGCCGCACgCTGCCGTAGCTTATCGTGCGCTGCGTGACCAgTTGAAtCCAGGCGAATATGGCTTGTtCCTCGGcACcGCGCATCcGGcGAAatTtAAAgAGAGCGTGGAAGCGATTCTCGGTGAAAcGTTGGatCTGCCAAAAGAGCTGGCAGAACGTGCTgATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAatTgaTGATGAaTCATCAGTAA
|
||||||
|
hypothetical protein
|
||||||
|
AtGCAGCCcGGCTtTTTTTATGAAGAAAATaTGGAGaAaAACGACagGGAAAAAGGAGAAATTCtCAATAAATGCGGtAACTTAGAgATTaGGATTGCGGAGAATaACAACTGCcGTTCTCaTCGCGTAATCTCCGGATATCGACCCaTAACGGgCAATGATAAAAGgAGTAACCTGTGA
|
||||||
|
Non-protein region
|
||||||
|
aAAAACTgCTGGAAACAATGAAAGAcGTACCGGACGACCAAcGTCAGgCGC
|
||||||
|
transaldolase B
|
||||||
|
ATGACGGACAAATTGaCCTCcCTTCGTCAGTACACCACCGTAgTGGCCGACACTGGGGACATCGCGGCAATGAAGcTGTaTCAACcGCAGGATGCCACAACCAAcCCTtCTCTCATTCTTAACGCAGCGCAGATTCcGGAATACCGTAAgTTgATTGaTGATGCTGTCGCCTGGGcGAaACaGCAGAGCAAcGATcGCgCgCAGCAgATCGtGGACGCGACCGAcAAACTGGCAGTAaATATTgGTCTgGAAaTCCTGAAACTGgTTCCGgGCCgTATCTCAActGAAGTtGATGCGCGTCTTTCCTATGACaCCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGcAGGTaTTAGCAACGATCgTaTTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGcAGAACAGCTGGAAAAAGAaGGTATTAACTGTAAcCTGACCCTGCTgtTCTCctTCGCtCAGGcTCGTGCTTGTGCGGaAGCGGgCGTgTTCCTGaTCTCGcCGTTTgTTGGCcGTATTCTTGACTGGTAcAAaGCGAATACCGaTAAGAAAGAGtACGCTCcGGCAGAAGATcCGGGCGTGGTTTCTGTatCtGAAATCtACCAGtACTACaAAGAGCATGGTTaTgAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAAcTGGCAGGCTGCGACCGTCTGACCatCGCACCGgcACTGCTGAAAGAGCTGgCGGAGAGCGAAGGGGCTATCgAACGTAAACTgTCTTACAcTGgTGAAGTgAAAGCgCGTCCGGcGCGTATCACtGAGtCCGAGTTCCTgTGgCAgCACAACCAGGATCCAATGGCAGTaGATAAACTgGcGGaAGgTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCtGTAA
|
||||||
|
molybdopterin biosynthesis mog protein
|
||||||
|
ATGAATACTTTACGTATTGGCTTaGTtTcCaTCTCTGATCGCGCATCCAGCGGCGTTTAtCAGgaTAAAgGCATCCCTGCGCTGGAagAATGGCTGACAtcGGCGCTAACCACGcCGTTTGAaCTGGAAAcCCgCTTaATCCCCGATGAGCAGGCGATCATCGAGCAaACgTTgTGTGAGCTGGTGGATGAAaTGAGtTGCCaTCTGGTGCTCACCACGGGCGGAAcTGGCCCTGCGCGTCGTGAcgTAACGCcCGATGcGACGCTGGCAGTAGCGGACCGCGAGATgCcAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACcaaCTGCGATCCTTTCGCGTCAGGTggGGGTgATTCGCAAACAGGCGCTGATCCTTAACTTaCcCGGTCAACCGAAGtCTATTAAAGAGACGCtGgAAGGTGtGAAGGACGCTGAGgGTAAcGTTGTGGTGCACGgTATTTTTGCCaGCGTaCcGTaCTGCATTCAGTTGCTGGAAGGGCCATACGTTGAaACGGCaCCgGaAGTGGTTGCAGCATTCAGaCCGAAGAGTGCAaGACGCGAAGtTAGCGAATAA
|
||||||
|
chaperone protein DnaK
|
||||||
|
aTGGGTAAAATAaTTGGTATCGACcTGGGTACtACCAaCTCTTGTGTagCGaTTAtGGATGGCACCACTCCtCGTGtACTGgAGAACGcCGAAGGCGATCGCACCAcGcCTTcTATCATTgCCTATACCCAGGAtGGTGAAACTCTGGTTgGTCAGCCGGCTAAACGTCAGGCAgtGACGAACCCgCAaAACAcCCTGTtTGCGATTAAACGCCtGATTGGCCGCCgCTTCCAGgACgAAGAAGTACAGCGtGATgTTTcCATCATGCCGTTCAAAATTAtTGcTGCtgatAACGGCGACGcATGGGTCGAAGtTAAAgGCCAGAAAATGGCAcCGCCGcAGAtCTCTGCTGAAGTGCTGAAAAAAAtGAAGAAAACCGCTGAAGaTTAcCTGGgTGAAcCGGTAACTGaAGCTgtTATTACCGTACCGGCAtACTttaACGATGCTCAGCGTCAGGcAACCAAAGaCGCAGGCCGTATCGCTGGTCTGGAAGTAAAaCGTATCATCAACGAaCCGACCGCAGCTGCGCTGGCTtACGGtCTGGACAAAGgTACTGGCAACCgtACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTcCATTATCGAaATCGACGAAGTTGACGGCgAAAAAACCttCGAAGTTCTGGCAACCAACGGTGATACCCACCTGgGTGGtgAAGACTTCGACAGTCGTCTGATCAACTAtCTGGTTGAaGAATTCAAgAAAGATCAGGGCATTGacCtGCGCAACGaTcCGCTGGCAATGCAGCGCCTGAAaGAAGCGGCAGAAAAAGCgAAAATCGAACTGTctTCCGCTCAGcAGACCGaCGTTAACcTGCCGTACATCACTGCAGACGCGAcCGGTCCGAAACACAtGAACATCaAAgTGactCGTGCGAAACTGGAAAGCCTgGtTGAAGAtCTGGTAAACCGtTcCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATAtCGACgaCGTTATTCTCGTTGGTGGTCAGACTCGTATGCcAATGGtTCAGAAGAAAGTTGCTGaATTCTTTGGTAAAgAGCcGCGTAAAGATGTTAACCCGGACGAAGCTGTaGCCATCGgTGCTGCTGTTCAGGGTGGTGTTCTGACTGGtGAcGTAAAAGaCGTacTGCTgCtGGACGTTACCCCGCTGTCtCTGGGTATcGaAACCaTGGGCGGTGTGATGACCACGCTGATCGCgAaAAACACCACTATCCCGACCAaGcAcaGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATcCATgtGCTGcAGGGTGAACgTAaACGTGCgGCTGAtAAcaAATCTCTgggTCAGTTcAACCTGGATGGTATCAaCCCGGCACCGcGCGGCAtgCCGcAGATCGAAGtTACCtTCGAtATCGaTGCTGACGGTATCCTGCaCGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCAcTATCAaGGCTTCTTCTGGtCTGAaCGAAGAtGAAATCCAGAAAATGGTACGCGaCGCAGAAGCTAAcGCCGAAGCTGACCGTAaGTTTGAAGAGCTGGTACAGACtcGCaACCAGGGCGACCATCTGCTGCACAgCACCCGTAAGCAgGTTGAAGAAGCAGGCGACAaACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGActGCACTgGAAACtGCTCTGAAaGGTGAAGaCAAAGcCgCTATcGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCaGCAGCAACATGCcCAGCAGCAGACTGCCGGTGCTgATgCTTCtGCAAaCAAcGCGAAAGaTGACGATGTTGTCGACGCtGAATTTGAAGAAGTCAAAGACAAAAAATAA
|
||||||
|
chaperone protein DnaJ
|
||||||
|
GTGCatTCatCTAGGGGcAATTTAAAAAAGATGGCTAAGCAAGATTaTTACGAGaTTTTAGGCGTTTCCAAAaCAGCGGAAGAGCGtGAaaTCAAAAaGGCCTACAAACGCCTGGCCATGAAaTACCaCCCGGaCcGTAACCAGGgTGACAAAGaGGCCGAGGCGAAATTTAAAGAGATCAAGGaAGCTTATGAAGTTCTGACCGACtCGCAAAAACgTGCgGCATaCGATCAGTaTGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGcGGtTTTGGCGGCGGCgCAGACTTcAGCGATAtTTtTGGTGACGtTTTCGGCgATATTTTTGGcGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTAcGCTATAACATGGAGctCACcCtCGAAgAAGCTGTACGtgGCGtGaCCAAAGaGATccGCATtCCGACTCtGGAAGAGTGTGACGTTTGCCACgGTAGCgGTGCAAAACCaGGTACACAgCCgCAGACCTGTCCGACcTgTcATGGTTCTGGCCAGGtGCAGATGcGCCAGGGTTTCTTTGcCGTGCAGCAGACCTgTCcAcACTGTCAGGGCCGCGGTACGCTGaTcAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGtTGAGCgCaGCAAAACGCTGTCCGTTAAAATCCCGGCaGGGgTGGACACTGGAGaCCGCATCCGTCTTGCGgGCGAAGGTGAAGCGGGTGAACACGgCGCACCGGCAGGCGATCTgTACGTTCAGGTtCAGGTtAAACaGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGcGAAGTcCCGATCAAcTTCGCTATGgCGGCGcTGGGTGGTgaAATCGAAGTACcGACCcTTGATGGTcGcGTCaaACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAgCTGtTCCgTaTGCGCGGTAAAGGCGTCAAGTCtGTcCGCGGTGGcgCACAGGGTGATTtGCTATGCCGCGTTGTTGTCgaAACAcCGGTAGGTTTGAACgAGAAGCAGAAACAGCTGCTGCAAGaGctGCAAGAAAGCtTTGGTGGcCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCtTCTTtGATGGCGTGAaGAAGTTTTTTGACGaCCTgACTCGCTAA
|
||||||
|
hypothetical protein
|
||||||
|
TTGCTCTTaCTCGGATTCgTAAGCCGTGAAAACAGCAaCCTCCGtCTGGCCAGTTCGGATGTGAACCTCACAGAGgTCTTTTCTCGTTACCAgCGCCGCCACTACGGCGGTgATACAGATGACGATCAGgGcgACaAtcAtCgCcTTATGCTGCTTCATTGCTCtCTtCTCCTTGACCTTTCGGTCaGTAAGAgGCACTCTACATGTGTTCTGCATATAGgGGGCCTCGgGTtGATGgTAAAATAtCACTCGGGGCTTTTCTCTAtCTGCCGTTCAGCTAATgCcTGA
|
||||||
|
hypothetical protein
|
||||||
|
aTGTCTGCCAAaaGACGACTTCTTATTGCGtGTACCTTGAtAaCAGCTATcTATCAtTTTCCTGcaTATTCTTCATTAgAATATAAAGGAtCCTTTGGTTCAATaAATGCGGGTTAtGCAGACTGGAATAGTGGaTTTgTAAaCACTCACCGTGGTGAaGTATGGAAAGTGACtGCGGATTTTGGGgTaAATTTTAAAGAAGCAGAATTTTACTCAtTTTATgAaAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACgGtTTCAGCAATGaCGCATGTCAGACTCtTTGaCtCTGATaTGACATTCTTTGGCAAAATTTaTGgCCAATGGGATAACTCATgGggTGAcGATCTgGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCgAgTGGgGCTTTTtTAAACCGTATATTGGATtGCATAATCAATCTGGTGACTACGTATCAGCTAAATaTgGTCAAACGAATgGTTgGAATGGtTATGTTGTTGGCTGGACAGCAgTATTAcCATTTAcGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGaAATAGAACTGGACAGGaACGATGCTTACACGgAgCAGcAATTTGGCcGGAACGGgTTaAaTGGCGGtTTAACTATTGcCTGGAAGTTCTATCCTCGCTGGAAAGCCAGtGTGACGTGGCGTTATTTcGATAAtAaGCTGGGCTACGATGGCTTTgGcgaTCAAATGATTTAtATGCTTGgTTATGATTTCtAA
|
||||||
|
putative secreted sulfatase
|
||||||
|
ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAAtGCTTTTAGtCCTGCCTTAGCCGCAGAGGCTaAACAACcTAATTTAGTCATtaTTATGGCGGaTGATtTAGGTtaTGGCGAtTTAGcAaCaTATGGTCATCAGATCGTTAAAACACctAATATCGACAGGCtTGCCCAgGAAGGGGTCaAATTtACTGAcTaCTATGCCCCCGCTCCTTtAaGTTCAccTtCACGCGCaGGGCTATTAACCGGCcGGATGCCATTtCGTAcTGGAATTCGCTCATGGATtCCttCAGGCAAAGATGTTGCCtTAGGGCGTAACGAAcTCACgATTGCTAaTCTACTCAaAgCGCAaGGGTACGACACggCAATGATGGGTAAGCTGCATCTGAATgCAGGcGGCGaTCGCACCGATCAgCCaCAAGCACaAgATATGGGcTTTGATTAcTCAcTGGTtAATACgGCGGGCTTTGTTACcGACGCCACGCTGGATAAcGCTAAAGAACGCCcGCGTTATGGCATGGTTtAccCGACAGGCtgGCtACGTAACGGGCAACCCACTcCACGaGCTGATAAAAtGAGCGGTGAGTATGTCaGTTCGGAAGTCGTCAACTGGCTGGATAACAAAaaGGACaGCAAGCCTTTCTTCCTCTATgTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAaaATACCTCGATaTGTaCTCACaATATATGAGCGCGTATCAGAAGCAGcATCCTGATTTAtTTTaTGGCGACTGGGcAgACAAACCCTgGCGTgGTGTGGGgGAATATTAtGCCAATATCAGCTATCtGGATGCAcAGGTTGGAAAAgTGCTGGaTAAAATCAAAGCTGTGGgtGaAGaaGaTAACACAATCGTTATTTTTACCAGTGatAACGGTCCgGTAaCGCGTGAAGCGCGCAAAGTGTATgAGCTGAATTTGGCAGGGGAaACGGaTGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGtGTTCCaGCCATTATTAAATaTGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGtCTgGACTGGATGCCTACtTTaGCgAaAATGATGAACTTCAAATTACCTACAGAcCGTAcTTTCGATGgTGAATCGCTGGTTCCTGtTcTTGAGCaAAAAGCATTGAAACGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATgATCCAAcCGATGAATGGGCGATCCGTGATGgTGACTGGAAgAtGATTATCGATCGcaATAATAAACcGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAaCaCTTaAtCTGATCGGTAAAAAAACAgATATTGAAAAACAGATGTATGGTaAGtTTtTAAAATATAAAACTGATATTGATaATGATtCTCTAATGAAAgCCAGAGGTGATAAACCAGAAGCGGTGACCTggGGCTAa
|
||||||
|
putative cytoplasmic protein
|
||||||
|
ATGTTTACcAacGTAAATGTTGATTGtTgCAAAACACCAGGAtGTAAaaACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCAcAGgGTaAaAATATTTtATGCCGTGAATGTgGTTaCTTGTtTCCAGtGATATCTGAACAGTCGCTTAAtATTTaTCGTAATATTGTGAAtcACTcCTGGAGAGGTTTGATTTGCCAATGTTCAACTtGCGGAGGcACGTCCCTCAAAAAATaTGgATATtCtGCAcAagGCCAgAGAAGAATgTATTGCcaTCAtTGTGaGAAAACaTTtATCACTCTGGAAcAtGTAATTACcACACCACGAGGAGCcCTGTTAGcATTGATGATTGAGCAAGGGGAGGCACTTGCGGaTATCAgAAAGTCATTACGTCTTAACAgCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGcAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGtACCCGCGCTTtTCGcgTCAAGTAtAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGcGGCAGGGTgGTTGcCaTCTCAACCAATTACTCCCCATCtGCCGTAGagCaaCATTATcAATACaCATCGAACtATGAAGAGcGTATGTCTCCAGGGACGCTGGCACAtCATGTCCAGCGCAAAGAGttACTTACTATGCGGCgGGATACCTTGTTTGATATTGATTACGGCcCGgCAGTTTTACATCAAAACGATCCGGGAATGtTGGTAaAaCCGGTTCTTCCGGCATaTCGTCATTTTgAACTGGTCAGAATACTGACCGATGAGCATtCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATaTTGGGCGGCTGcCTGATGGCTAATTTGCAGCaTATTCATCAaGGTCGCTGCCATATTTCcTTTGTCAAaGAGCGcGGTGTGGCACCCGCCACCATTGaTTTTCCACCGCGATtATTCcTTAGTgGtGGgGTACgAAATAATGTCTGGCGTGCaTTTTCTAACCGCAATTATTCAaTGGCTGTATGCAAtCTCaCTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATtGAACAGTGCGACGCgTTtTATCCACTTTGTGgaGAACCATCCTTTCCTTATaTCATTGAACCGAATgtCTCCTGCGaaTGTCgtTTCTACaTTAGATaTCCTCAAACaTCTGTGGAATAaAaAACTAGagCATGGAACAATTtAA
|
||||||
|
sodium/proton antiporter 1
|
||||||
|
GTGAAACATCTGcATCGATTCTTTAGCaGTGATGCCTCGGGAGgCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTgcAaCCAGTGGATGGTATCACGACTTTCTTGAGACGCcGGTTCAGcTcCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGaCGCTCTGaTgGCGGTATTTTTCCTGTtGGTTGGTcTGGaAGTTAAAcGCGAGcTGaTGCAaGGTTCGCTGGCCAGTCtGCgCCAGGCGGCatTTCCTGTTATTGCCGcAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTtTtAACTATGCCGATCCGaTTaCCCGCGAAGGcTGGGCAatCCCGGCGGCGACTGacATTGCCTTTGCACTTggTgTGTTGGCGCTgTTGGGAAGTCGTGTTCCGTTAGCGCtGAAGATCTTTTtGATGGCTCTGGCtATTATCGACGATCTTgGGGcCATCATtATCATCGCATTGTTCTACAcTAATGACTTATCGATGGCCTcTCTTGGCGTcGCgGCTGTAGCAATTGCGgtACTCGCGGTATTGAAtCTGTgTGGTGTAcGCCGCACGGGCGTtTATATTCTGGTTGGCGTGGTGCtGTGGaCAGCGGTGTTGAAATCGGGGGTTCACGCAACCcTGGCTGGCGtCATtGtCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGgCGCTCTCcGgCTAAACGTCTGGAGCATGTTTTGCAtCCATGGGTGGCGTATCTGATtTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAaGGTgTCACGCtggAaGGTTTgACCtCCATTCTGCCATTAGgGATCATCGCTGGTTTGCTGaTTGGCaAGCCACtGGGTAtTaGTCTgttcTGCTGGtTGGcgCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACgACTtACCAGCAAATTATGGCGGtTGGTaTCcTGTGCGgTATCgGTTtTAcTatGTCTATCTTTATTGCCAGCCTGGcATTTGGTAgCGTAGATcCAGAaCTGaTTAACtGGGCAAAAtTAgGTATCCTTGTCGGTTCAATTTCtTcGgCGGTAATTGGATATAGcTGGTTACGcGTTCGTTTACGTCcATcAGTTTGA
|
||||||
|
transcriptional activator protein NhaR
|
||||||
|
ATGAGCATGTCTCATaTCAATTACAACCACTtGTATTACTTCTGGCaTGTCTAcAAAgAaGGTTCTGtGGTTGGCgCAGCGGAGGCGCTTTATTTAACAcCAcAAACCATTACCGGGCaGATCCGGGCGCTGGAaGAGCGCCTGCAAGGGAAAcTATTTAAGCGTAAAGGAcgTGGTCTGGAACCCAgcGAACTGGGGGAACTGGTCTATCGCtATGCCGATAAAATGTTCAcCTTAAgCCAGGAAATGCTgGATATCGTCAACTATCGCAAAGAGTCCAACTtATTGtTTGATGTTgGTGTGGCAGATGCACTTtcCAAAcGtcTGGTCAGCAGTGTTCtgGATgCCGCAGTtgTGGAAGACGAGCAGAtCCATCTACGCTGTTTCGAaTCGACGCACGAGATgCTTTTaGAGCAgtTGAGTCAGCATAaACTGGATATGATcaTCTCTGACTGTCCGaTCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAaTtGGCGAATGTGGTGTCAgtTTCTGGTgCACTAACCCACTACcAGAAAAGCCGTTTCCTGCCtGTCTTGAAgAGCgTCGtTtACTTATTCCGGGGCGTCGCTCAaTgTTGGGGCGtAAACTATTAAACTGGTTTAACTCcCAGGGCTTGAACGTCGAAATTTTGgGTGAGTTTGATGATGCTGCGTTGATGAAAgCCTTTGGGGCGAcGCATAACGcTATTTTCGTTGCACCTTCGCtTTACGCTAATgATTTCTATAACgATGACTCGgTtGTGgAGATAGgCCGTGTTGAGaACGTGATGGAAGAGTACCACGCGATTTtTGCCGaAAGgaTGAtTCAgCACCCTGcAGTAcAGCGTATCTGcAATACAgacTATTCTGCGCtgTTTACTCCAGCTTcAAAATAA
|
||||||
|
riboflavin kinase
|
||||||
|
ATGAAGCTGATACGCGgCAtACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTaATTTCGACGGCGTGCATCGCggTCATCGCGCGCTGTTACAGGGCtTGCAGGAAGAAGGGCGCAAGCGCAACtTACCGGTGATGGTGATGCTTTTtGaACCTCAACCAcTGGAACTGTTTGCTACTGAtAAAGCcCCGGCACGGcTcACcCGGCTGCgGGAAAAACTGCgTtaTcTTgCAGAgTGTGGCGTTGATTACGTGCTGTGCGtGCGTtTTGaCaGGCGTtTTGCGGCGTTAACCGCGcAAAACTTCATCAgTGATCTtCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGAtTTCCGCTTTggCGCTGgTCGTGAAgGCGAtTTCTtGTTATTACAGAaAGcgGGCATGGAATACGGCTTCGATATcACCAGCaCGCAAAcTTtTTGCGAAGGTGGTGTGCGtATCAGcAGCACCGCCGtgCGTCAGGCGCtTGCGgATgACAATCTGGCTCTGGCAGAAAGTTTACTGGgGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGaATTAGGGCGCAcTATAGGTTTCCCgACGGCGaATGTACCGcTaCgCCGTCAGGTTTCCCCGGTGAAAgGGGTTTATGCGGTAGaAgTgTTGGgCCtTGgCGAAaAGcCGTTAcCCGGcgTTGCAAACaTCGGAACACgCCCAACGGTTGCcGGTATTCGCCAGCAACTGgaAGTGCATTTGTTAGATGTTGcAATGGaCCTTTATGGTCGCCAtATACAAGTAGTGCTGCGtAAAAaAATAcGCAATGAGCAgCGATTTGcATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGcCCGCGaaTTTtTTGGGCTAAcAAAACCGGCTTAa
|
||||||
|
Isoleucyl-tRNA synthetase
|
||||||
|
ATGAGTGACTATAAATCaACCCTgAATTTGCCgGAAACAGgGTtCCCGATgCGTGGCGATCTCGcCAAGCGCGAAcCGGGaATGCTGGCGCGTTGGACTGATGATGATCTgTaCGGCATCATCCGTGCGGCTaAAAAAGGCAaAaAAACCTTCAtTCTGCATgATGGCCcTCCTTATGCGAATGGCAGCAtTCaTATTGGTcACTCGGTTAACAAGATTCTGAAAGACATTaTCATTaAgTCCAAAgGGCTttCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCaTGGtCTGCCAATCGAAcTGAAAGTAGAGCAAGAATACGGTAAGCCGGGgGAGaAaTTCACCGCCGcTGAGTtCCGCGCCAAGTGCCGCGAATACGCTGCgACCCAGGTTGACGGTCAGCGCAAAGACTTTaTCcGTCTGGGCGTGCTGGGCGActgGTCgcACCCGTACCTGACCATGGACtTCAAAACTGAAGCCAACATCATCCgCGCGCTGGGCAAAATCATCGGCAAcGGTCACCTGCACaAAGGcGCGAAGCCGGTgCACTGGTGCgTTGACTGCCGTTCTgCACTGGCAGAAGCGGAAGtTgAGTATTACGacAAAACTtCTCCGTCCATCGACGTCGCTTtCCAGGCGGTCGATCaGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATgTTAACGGCCCAATTTCGCtGGTTATCTGGaCcACCACGcCGTGgAcGCTGCcTGCTAacCGCgCAATCTCcATtGCACCTGATTTTGAttATGCGCTGGTGCaAatCgACGGTCAGgCCGTGATCCTCGCGAAAGATCtGGtTGaAAGCGTAAtGCAGCGTATCGGCGTTAGCGaTTACACCATTCTTGGCAcGGtgAAAGGTGCCGAGCtGGAACTGTTgCGCTTTACCCATCCGTTtATGGACtTCGATGTTCCGGCAaTTCTCGGCGACcACGTTACgCTGGATGCCGGTACCGGTGcCGTTCATACCGCGCCAGGCcACGGTCCGGaCGACTATgTGATCGGTcAAAAATaTGgTCTGGAAaCCGCTAACCCgGTTgGCcCGGACGgCACtTaTCTGCcGgGTACTTACCCGACTCtGGATgGCGTTaACGTCTTCAAAGCGAACGaTATTGTCATTGCGTTGTTgCAGGAAAAAGGcgCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTgCTGCtGGCGTCaTAAaACGCCGATCAtCTTCCGcgCGACGCCGCAGTGGTTCGTCAgCAtgGATCAGAAAGGTCTGCgTGCGcAGTCACTGAAAGAGATCAAAGGCgTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATcTCTCGTCaGCGTACCTGGGGcGTGCCgATGTCACTGTTCGTgCaCAaaGACACAGAAGAaCTGcATCCGCgTACTCtcGAACTGaTGGAAGAAGTGGcAAAACGCGTTgAAGTtGACgGCATTCAGGCgTGGTGGGATCTCGATGCGAAaGAgATCcTCGGCGaCGAAGCTGACCAGTATGTGAAAGTACCGGATACGCtGgATGTATGGTtTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTcCGGAATtTGCCGGTCACGCAGCGGACATGTaTcTGgAaGGTTCTGACCAACACcGTGgCTGGTtCATGTCtTCCCTGATGATCTCTACCGCGATGAAGGGcAAAGcGCCATATCGTCAGGTACTGACTCACGGCTTTAcCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGtAACaCcGTTTCGCCGCAGGATGTgATGAATAAACtGGGtGCGGATATTCTGCGTCTGTGGGTGGcATCAACCGACTAcACTGGCGAAATGGCcGtTTCTGACGAGATCcTGAAACGtGCTGCcGACAGCTATCGTCGTATCcGTAACAcCgCGCGCTTCCTGCTGGCAAACCTGAA
CgGTTtTGAtCCGGCaAAAGaTATGGTGAAACCGGAAGAGATGGTGGTaCTGGATCGCTGGGCCGtAGGTTGTGCGAAAGCGGCACAGGAAGACATCCtCAAGGCgTACGAAGCATACGATTTCcACGAAGTGGTaCAGCGTcTGaTGCGCtTCTGCTCCGTTGAGATGgGTTccTTCTACCTCGACATCATCAAAGACCGTCAgTATACcGCCAAAGCGGaCAGCGTGGCGCGTCGTAGCTGCCAGAcTgCGCTGTATCACATCGCaGAAGCGCTGGTTCGCTGGATGGCAcCAATCCTCTCCTTCaCcGCTGaTGAAGTGTGGGGtTaCCTGCCggGCGAACGTGAAAAATACGTCTTCAcCGGCgAgTGgTACGAAGGCCTGtTTGGTCTGGCAGACAGTGAAGCAATGAACGaTGCGTTCTGGGACGAGCTGTTGAAAGTGcGTGGCGAAGTGAAcAAAGTcaTTGAGCAAGCgCGTGCCGATAAGAACGTGGGcGGCTCGCTGGAAGCGGCAGTAAcCTTGTATGCAGAACCGGAaCTGGCgGCGAaaCTGaCCGcGCTGGGCGAtGAATTACGATTTGTCCTGtTGACCTCCGgCGCTAcCGTTGcAGACtATAACGACGCACCTGCTGATGCCCAGCAGaGCGAaGTcCTCAAAGGGCTGAAAgtCGCGTTGAGTAAAGCCgAAGGtGaGAAGTGTCCtcGctGCTGgCACTACACCcAGgATGTcGgCAAGGTGGCGGaACACGCAGAAATCTGCGGCCGCTGTgTcAgCaACGTCGCCGGTGACGGTGAAAAaCGTAAGTTTGCCTGA
|
||||||
|
Non-protein region
|
||||||
|
GCTTGCGCCAACGcCATTTCATCGCCATCCCGCCgAgcATACAGGCCTCGgAaGAACCAaTGGTGTTGGTGcCAACGGCCtGAccATTTTTcGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGcAGaTTGCGGATATTctTCTTTGTCGATCCAGTTTTTGTtAATGGAtAAAtCCA
|
||||||
|
FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase
|
||||||
|
ATGTCTGAATCTGTACAGaGCAaTAgCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGAtGGCaCCAcCGCTGAGTCTACCCGCAaCAaCGGTAaACCGGCGCTGTTCCGCcTGgGTgATGCTTCTCTTTCTgAaGgGCTGGAGCAACACCTGCTgGGGCTGAAAGTGGgCGATAAAACCaCCTTCtCGCTGGAGCCAGATGCGGCgTTtgGCGTGCCGTcACCgGAcCTGATtCAGTAcTTCTCcCGCCGTGAATTTATGgATGCAGGCGAGCcaGAAATTGGCGCAATCATgCTTTTTACCGCAATGGaTGGCAGTGAGATGCCTGGCGTGaTCCGCgAAATTAACGGCGACTCCATTACCGTTGATTTCAACCaTCCGCTgGCCGGGCAGACCGTTCATTTTGATATTGaagTGCTGGaAATCGATCCGGCAcTGGAGGcGTaA
|
|
@ -0,0 +1,5 @@
|
||||||
|
This program reports information about DNA
|
||||||
|
nucleotide sequences that may encode proteins.
|
||||||
|
|
||||||
|
Input file name? ecoli.txt
|
||||||
|
Output file name? ecoli_file.txt
|
|
@ -0,0 +1,140 @@
|
||||||
|
Region Name: thr operon leader peptide
|
||||||
|
Nucleotides: ATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGA
|
||||||
|
Nuc. Counts: [21, 22, 12, 11]
|
||||||
|
Total Mass%: [33.5, 28.9, 21.4, 16.2] of 8471.7
|
||||||
|
Codons List: [ATG, AAA, CGC, ATT, AGC, ACC, ACC, ATT, ACC, ACC, ACC, ATC, ACC, ATT, ACC, ACA, GGT, AAC, GGT, GCG, GGC, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: aspartokinase I/homoserine dehydrogenase I
|
||||||
|
Nucleotides: ATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGGGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCATCTGGTAGCGATGATTGAAAAAACCATTAGCGGTCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTCTGACGGGACTCGCCGCCGCCCAGCCGGGATTTCCGCTGGCACAATTGAAAACTTTCGTCGACCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATCAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCATTATGGCCGGCGTGTTAGAAGCGCGTGGTCACAACGTTACCGTTATCGATCCGGTCGAAAAACTGCTGGCAGTGGGTCATTACCTCGAATCTACCGTTGATATTGCTGAATCCACCCGCCGTATTGCGGCAAGCCGCATTCCGGCTGACCACATGGTGCTGATGGCTGGTTTCACTGCCGGTAATGAAAAAGGCGAGCTGGTGGTTCTGGGACGCAACGGTTCCGACTACTCCGCTGCGGTGCTGGCGGCCTGTTTACGCGCCGATTGTTGCGAGATCTGGACGGATGTTGACGGTGTTTATACCTGCGATCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAGTCGATGTCCTATCAGGAAGCGATGGAGCTTTCTTACTTCGGCGCTAAAGTTCTTCACCCCCGCACCATTACCCCCATCGCCCAGTTCCAGATCCCTTGCCTGATTAAAAATACCGGAAATCCCCAAGCACCAGGTACGCTCATTGGTGCCAGCCGTGATGAAGACGAATTACCGGTCAAGGGCATTTCCAATCTGAATAACATGGCAATGTTCAGCGTTTCCGGCCCGGGGATGAAAGGGATGGTTGGCATGGCGGCGCGCGTCTTTGCAGCGATGTCACGCGCCCGTATTTCCGTGGTGCTGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTCCGCAAAGCGACTGTGTGCGAGCTGAACGGGCAATGCAGGAAGAGTTCTACCTGGAACTGAAAGAAGGCTTACTGGAGCCGTTGGCGGTGACGGAACGGCTGGCCATTATCTCGGTGGTAGGTGATGGTATGCGCACCTTACGTGGGATCTCGGCGAAATTCTTTGCCGCGCTGGCCCGCGCCAATATCAACATTGTCGCCATTGCTCAGGGATCTTCTGAACGCTCAATCTCTGTCGTGGTCAATAACGATGATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTTGTGATTGGCGTCGGTGGCGTTGGCGGTGCGCTGCTGGAGCAACTGAAGCGTCAGCAAAGCTGGTTGAAGAATAAACATATCGACTTACGTGTCTGCGGTGTTGCTAACTCGAAGGCACTGCTCACCAATGTACATGGCCTTAATCTGGAAAACTGGCAGGAAGAACTGGCGCAAGCCAAAGAGCCGTTTAATCTCGGGCGCTTAATTCGCCTCGTGAAAGAATATCATCTGCTGAACCCGGTCATTGTTGACTGTACTTCCAGCCAGGCTGTGGCAGATCAATATGCCGACTTCCTGCGCGAAGGTTTCCACGTTGTTACGCCGAACAAAAAGGCCAACACCTCGTCGATGGATTACTACCATCAGTTGCGTTATGCGGCGGAAAAATCGCGGCGTAAATTCCTCTATGACACCAACGTTGGGGCTGGATTACCGGTTATTGAGAACCTGCAAAATCTGCTCAATGCTGGTGATGAATTGATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTATATCTTCGGCAAGTTAGACGAAGGCATGAGTTTCTCCGAGGCGACCACACTGGCGCGGGAAA
TGGGTTATACCGAACCGGACCCGCGAGATGATCTTTCTGGTATGGATGTGGCGCGTAAGCTATTGATTCTCGCTCGTGAAACGGGACGTGAACTGGAGCTGGCGGATATTGAAATTGAACCTGTGCTGCCCGCAGAGTTTAACGCCGAGGGTGATGTCGCCGCTTTTATGGCGAATCTGTCACAGCTCGACGATCTCTTTGCCGCGCGTGTGGCGAAGGCCCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATATTGATGAAGATGGCGTCTGCCGCGTGAAGATTGCCGAAGTGGATGGTAATGATCCGCTGTTCAAAGTGAAAAATGGCGAAAACGCCCTGGCCTTCTATAGCCACTATTATCAGCCGCTGCCGTTGGTACTGCGCGGATATGGTGCGGGCAATGACGTTACAGCTGCCGGTGTCTTTGCTGATCTGCTACGTACCCTCTCATGGAAGTTAGGAGTCTGA
|
||||||
|
Nuc. Counts: [551, 608, 692, 612]
|
||||||
|
Total Mass%: [23.0, 20.9, 32.4, 23.7] of 323152.2
|
||||||
|
Codons List: [ATG, CGA, GTG, TTG, AAG, TTC, GGC, GGT, ACA, TCA, GTG, GCA, AAT, GCA, GAA, CGT, TTT, CTG, CGG, GTT, GCC, GAT, ATT, CTG, GAA, AGC, AAT, GCC, AGG, CAG, GGG, CAG, GTG, GCC, ACC, GTC, CTC, TCT, GCC, CCC, GCC, AAA, ATC, ACC, AAC, CAT, CTG, GTA, GCG, ATG, ATT, GAA, AAA, ACC, ATT, AGC, GGT, CAG, GAT, GCT, TTA, CCC, AAT, ATC, AGC, GAT, GCC, GAA, CGT, ATT, TTT, GCC, GAA, CTT, CTG, ACG, GGA, CTC, GCC, GCC, GCC, CAG, CCG, GGA, TTT, CCG, CTG, GCA, CAA, TTG, AAA, ACT, TTC, GTC, GAC, CAG, GAA, TTT, GCC, CAA, ATA, AAA, CAT, GTC, CTG, CAT, GGC, ATC, AGT, TTG, TTG, GGG, CAG, TGC, CCG, GAT, AGC, ATC, AAC, GCT, GCG, CTG, ATT, TGC, CGT, GGC, GAG, AAA, ATG, TCG, ATC, GCC, ATT, ATG, GCC, GGC, GTG, TTA, GAA, GCG, CGT, GGT, CAC, AAC, GTT, ACC, GTT, ATC, GAT, CCG, GTC, GAA, AAA, CTG, CTG, GCA, GTG, GGT, CAT, TAC, CTC, GAA, TCT, ACC, GTT, GAT, ATT, GCT, GAA, TCC, ACC, CGC, CGT, ATT, GCG, GCA, AGC, CGC, ATT, CCG, GCT, GAC, CAC, ATG, GTG, CTG, ATG, GCT, GGT, TTC, ACT, GCC, GGT, AAT, GAA, AAA, GGC, GAG, CTG, GTG, GTT, CTG, GGA, CGC, AAC, GGT, TCC, GAC, TAC, TCC, GCT, GCG, GTG, CTG, GCG, GCC, TGT, TTA, CGC, GCC, GAT, TGT, TGC, GAG, ATC, TGG, ACG, GAT, GTT, GAC, GGT, GTT, TAT, ACC, TGC, GAT, CCG, CGT, CAG, GTG, CCC, GAT, GCG, AGG, TTG, TTG, AAG, TCG, ATG, TCC, TAT, CAG, GAA, GCG, ATG, GAG, CTT, TCT, TAC, TTC, GGC, GCT, AAA, GTT, CTT, CAC, CCC, CGC, ACC, ATT, ACC, CCC, ATC, GCC, CAG, TTC, CAG, ATC, CCT, TGC, CTG, ATT, AAA, AAT, ACC, GGA, AAT, CCC, CAA, GCA, CCA, GGT, ACG, CTC, ATT, GGT, GCC, AGC, CGT, GAT, GAA, GAC, GAA, TTA, CCG, GTC, AAG, GGC, ATT, TCC, AAT, CTG, AAT, AAC, ATG, GCA, ATG, TTC, AGC, GTT, TCC, GGC, CCG, GGG, ATG, AAA, GGG, ATG, GTT, GGC, ATG, GCG, GCG, CGC, GTC, TTT, GCA, GCG, ATG, TCA, CGC, GCC, CGT, ATT, TCC, GTG, GTG, CTG, ATT, ACG, CAA, TCA, TCT, TCC, GAA, TAC, AGT, ATC, AGT, TTC, TGC, GTT, CCG, CAA, AGC, GAC, TGT, GTG, CGA, GCT, GAA, CGG, GCA, ATG, CAG, GAA, GAG, TTC, TAC, CTG, GAA, CTG, AAA, GAA, GGC, TTA, CTG, GAG, CCG, TTG, GCG, GTG, ACG, GAA, CGG, CTG, GCC, 
ATT, ATC, TCG, GTG, GTA, GGT, GAT, GGT, ATG, CGC, ACC, TTA, CGT, GGG, ATC, TCG, GCG, AAA, TTC, TTT, GCC, GCG, CTG, GCC, CGC, GCC, AAT, ATC, AAC, ATT, GTC, GCC, ATT, GCT, CAG, GGA, TCT, TCT, GAA, CGC, TCA, ATC, TCT, GTC, GTG, GTC, AAT, AAC, GAT, GAT, GCG, ACC, ACT, GGC, GTG, CGC, GTT, ACT, CAT, CAG, ATG, CTG, TTC, AAT, ACC, GAT, CAG, GTT, ATC, GAA, GTG, TTT, GTG, ATT, GGC, GTC, GGT, GGC, GTT, GGC, GGT, GCG, CTG, CTG, GAG, CAA, CTG, AAG, CGT, CAG, CAA, AGC, TGG, TTG, AAG, AAT, AAA, CAT, ATC, GAC, TTA, CGT, GTC, TGC, GGT, GTT, GCT, AAC, TCG, AAG, GCA, CTG, CTC, ACC, AAT, GTA, CAT, GGC, CTT, AAT, CTG, GAA, AAC, TGG, CAG, GAA, GAA, CTG, GCG, CAA, GCC, AAA, GAG, CCG, TTT, AAT, CTC, GGG, CGC, TTA, ATT, CGC, CTC, GTG, AAA, GAA, TAT, CAT, CTG, CTG, AAC, CCG, GTC, ATT, GTT, GAC, TGT, ACT, TCC, AGC, CAG, GCT, GTG, GCA, GAT, CAA, TAT, GCC, GAC, TTC, CTG, CGC, GAA, GGT, TTC, CAC, GTT, GTT, ACG, CCG, AAC, AAA, AAG, GCC, AAC, ACC, TCG, TCG, ATG, GAT, TAC, TAC, CAT, CAG, TTG, CGT, TAT, GCG, GCG, GAA, AAA, TCG, CGG, CGT, AAA, TTC, CTC, TAT, GAC, ACC, AAC, GTT, GGG, GCT, GGA, TTA, CCG, GTT, ATT, GAG, AAC, CTG, CAA, AAT, CTG, CTC, AAT, GCT, GGT, GAT, GAA, TTG, ATG, AAG, TTC, TCC, GGC, ATT, CTT, TCA, GGT, TCG, CTT, TCT, TAT, ATC, TTC, GGC, AAG, TTA, GAC, GAA, GGC, ATG, AGT, TTC, TCC, GAG, GCG, ACC, ACA, CTG, GCG, CGG, GAA, ATG, GGT, TAT, ACC, GAA, CCG, GAC, CCG, CGA, GAT, GAT, CTT, TCT, GGT, ATG, GAT, GTG, GCG, CGT, AAG, CTA, TTG, ATT, CTC, GCT, CGT, GAA, ACG, GGA, CGT, GAA, CTG, GAG, CTG, GCG, GAT, ATT, GAA, ATT, GAA, CCT, GTG, CTG, CCC, GCA, GAG, TTT, AAC, GCC, GAG, GGT, GAT, GTC, GCC, GCT, TTT, ATG, GCG, AAT, CTG, TCA, CAG, CTC, GAC, GAT, CTC, TTT, GCC, GCG, CGT, GTG, GCG, AAG, GCC, CGT, GAT, GAA, GGA, AAA, GTT, TTG, CGC, TAT, GTT, GGC, AAT, ATT, GAT, GAA, GAT, GGC, GTC, TGC, CGC, GTG, AAG, ATT, GCC, GAA, GTG, GAT, GGT, AAT, GAT, CCG, CTG, TTC, AAA, GTG, AAA, AAT, GGC, GAA, AAC, GCC, CTG, GCC, TTC, TAT, AGC, CAC, TAT, TAT, CAG, CCG, CTG, CCG, TTG, GTA, CTG, CGC, GGA, TAT, GGT, GCG, 
GGC, AAT, GAC, GTT, ACA, GCT, GCC, GGT, GTC, TTT, GCT, GAT, CTG, CTA, CGT, ACC, CTC, TCA, TGG, AAG, TTA, GGA, GTC, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: homoserine kinase
|
||||||
|
Nucleotides: ATGGTTAAAGTTTATGCCCCGGCTTCCAGTGCCAATATGAGCGTCGGGTTTGATGTGCTCGGGGCGGCGGTGACACCTGTTGATGGTGCATTGCTCGGAGATGTAGTCACGGTTGAGGCGGCAGAGACATTCAGTCTCAACAACCTCGGACGCTTTGCCGATAAGCTGCCGTCAGAGCCACGGGAAAATATCGTTTATCAGTGCTGGGAGCGTTTTTGCCAGGAGCTTGGCAAGCAAATTCCAGTGGCGATGACTCTGGAAAAGAATATGCCGATCGGTTCGGGCTTAGGCTCCAGCGCCTGTTCAGTGGTCGCGGCGCTGATGGCGATGAATGAACACTGCGGCAAGCCGCTTAATGACACTCGTTTGCTGGCTTTGATGGGCGAGTTGGAAGGGCGTATCTCCGGCAGCATTCATTACGACAACGTGGCACCGTGTTTTCTTGGTGGTATGCAGTTGATGATCGAAGAAAACGACATCATCAGCCAGCAAGTGCCAGGGTTTGATGAGTGGCTGTGGGTGCTGGCGTATCCGGGGATTAAAGTCTCGACGGCAGAAGCCAGGGCTATTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCACGGGCGACATCTGGCAGGCTTCATTCACGCCTGCTATTCCCGTCAGCTTGAGCTTGCCGCGAAGCTGATGAAAGATGTTATCGCTGAACCCTACCGTGAACGGTTACTGCCAGGCTTCCGGCAGGCGCGGCAGGCGGTTGCGGAAATCGGCGCGGTAGCGAGCGGTATCTCCGGCTCCGGCCCGACTTTGTTCGCTCTGTGTGACAAGCCGGATACCGCCCAGCGCGTTGCCGACTGGTTGGGTAAGAACTACCTGCAAAATCAGGAAGGTTTTGTTCATATTTGCCGGCTGGATACGGCGGGCGCACGAGTACTGGAAAACTAA
|
||||||
|
Nuc. Counts: [193, 226, 295, 219]
|
||||||
|
Total Mass%: [21.2, 20.4, 36.2, 22.2] of 123170.2
|
||||||
|
Codons List: [ATG, GTT, AAA, GTT, TAT, GCC, CCG, GCT, TCC, AGT, GCC, AAT, ATG, AGC, GTC, GGG, TTT, GAT, GTG, CTC, GGG, GCG, GCG, GTG, ACA, CCT, GTT, GAT, GGT, GCA, TTG, CTC, GGA, GAT, GTA, GTC, ACG, GTT, GAG, GCG, GCA, GAG, ACA, TTC, AGT, CTC, AAC, AAC, CTC, GGA, CGC, TTT, GCC, GAT, AAG, CTG, CCG, TCA, GAG, CCA, CGG, GAA, AAT, ATC, GTT, TAT, CAG, TGC, TGG, GAG, CGT, TTT, TGC, CAG, GAG, CTT, GGC, AAG, CAA, ATT, CCA, GTG, GCG, ATG, ACT, CTG, GAA, AAG, AAT, ATG, CCG, ATC, GGT, TCG, GGC, TTA, GGC, TCC, AGC, GCC, TGT, TCA, GTG, GTC, GCG, GCG, CTG, ATG, GCG, ATG, AAT, GAA, CAC, TGC, GGC, AAG, CCG, CTT, AAT, GAC, ACT, CGT, TTG, CTG, GCT, TTG, ATG, GGC, GAG, TTG, GAA, GGG, CGT, ATC, TCC, GGC, AGC, ATT, CAT, TAC, GAC, AAC, GTG, GCA, CCG, TGT, TTT, CTT, GGT, GGT, ATG, CAG, TTG, ATG, ATC, GAA, GAA, AAC, GAC, ATC, ATC, AGC, CAG, CAA, GTG, CCA, GGG, TTT, GAT, GAG, TGG, CTG, TGG, GTG, CTG, GCG, TAT, CCG, GGG, ATT, AAA, GTC, TCG, ACG, GCA, GAA, GCC, AGG, GCT, ATT, TTA, CCG, GCG, CAG, TAT, CGC, CGC, CAG, GAT, TGC, ATT, GCG, CAC, GGG, CGA, CAT, CTG, GCA, GGC, TTC, ATT, CAC, GCC, TGC, TAT, TCC, CGT, CAG, CTT, GAG, CTT, GCC, GCG, AAG, CTG, ATG, AAA, GAT, GTT, ATC, GCT, GAA, CCC, TAC, CGT, GAA, CGG, TTA, CTG, CCA, GGC, TTC, CGG, CAG, GCG, CGG, CAG, GCG, GTT, GCG, GAA, ATC, GGC, GCG, GTA, GCG, AGC, GGT, ATC, TCC, GGC, TCC, GGC, CCG, ACT, TTG, TTC, GCT, CTG, TGT, GAC, AAG, CCG, GAT, ACC, GCC, CAG, CGC, GTT, GCC, GAC, TGG, TTG, GGT, AAG, AAC, TAC, CTG, CAA, AAT, CAG, GAA, GGT, TTT, GTT, CAT, ATT, TGC, CGG, CTG, GAT, ACG, GCG, GGC, GCA, CGA, GTA, CTG, GAA, AAC, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: threonine synthase
|
||||||
|
Nucleotides: ATGAAACTCTACAATCTGAAAGATCACAATGAGCAGGTCAGCTTTGCGCAAGCCGTAACCCAGGGGTTAGGCAAAAATCAGGGGCTGTTTTTTCCGCACGACCTGCCGGAATTCAGCCTGACTGAAATTGATGAGATGCTGAAGCTGGATTTTGTCACCCGCAGTGCGAAGATCCTCTCGGCGTTTATTGGTGATGAAATCCCGCAGGAAATCCTGGAAGAGCGCGTACGTGCGGCGTTTGCCTTCCCGGCTCCGGTCGCCAATGTTGAAAGCGATGTCGGTTGTCTGGAATTGTTCCACGGGCCAACGCTGGCATTTAAAGATTTCGGCGGTCGCTTTATGGCACAAATGCTGACCCATATTGCGGGCGATAAGCCAGTGACCATTCTGACCGCGACATCCGGTGATACTGGAGCGGCAGTGGCTCATGCTTTCTACGGTTTACCGAATGTGAAAGTGGTTATCCTCTATCCACGAGGCAAAATCAGTCCACTGCAAGAAAAACTGTTCTGTACATTGGGCGGCAATATCGAAACTGTTGCCATCGACGGCGATTTCGATGCCTGTCAGGCGCTGGTGAAGCAGGCGTTTGATGATGAAGAACTGAAAGTGGCGCTGGGGCTGAATTCTGCTAACTCCATCAACATCAGTCGCTTGCTGGCGCAGATTTGTTATTACTTTGAGGCTGTCGCACAGTTGCCGCAAGAAGCACGTAACCAGTTGGTTGTCTCGGTACCGAGTGGAAACTTCGGCGATTTGACGGCGGGTCTGCTGGCGAAGTCACTCGGTCTGCCGGTAAAACGTTTTATTGCTGCGACCAACGTGAACGATACCGTACCACGTTTCCTGCACGACGGTCAGTGGTCACCCAAAGCGACTCAGGCGACGTTATCCAATGCGATGGATGTTAGCCAGCCAAACAACTGGCCGCGTGTGGAAGAGTTGTTCCGCCGCAAAATCTGGCAACTGAAAGAGCTGGGTTATGCAGCCGTGGATGATGAAACCACGCAACAGACAATGCGTGAGTTAAAAGAACTGGGCTATACCTCGGAGCCGCACGCTGCCGTAGCTTATCGTGCGCTGCGTGACCAGTTGAATCCAGGCGAATATGGCTTGTTCCTCGGCACCGCGCATCCGGCGAAATTTAAAGAGAGCGTGGAAGCGATTCTCGGTGAAACGTTGGATCTGCCAAAAGAGCTGGCAGAACGTGCTGATTTACCCTTGCTTTCGCATAACCTGCCCGCCGATTTTGCTGCGTTGCGTAAATTGATGATGAATCATCAGTAA
|
||||||
|
Nuc. Counts: [309, 311, 358, 309]
|
||||||
|
Total Mass%: [24.7, 20.4, 32.0, 22.9] of 169069.5
|
||||||
|
Codons List: [ATG, AAA, CTC, TAC, AAT, CTG, AAA, GAT, CAC, AAT, GAG, CAG, GTC, AGC, TTT, GCG, CAA, GCC, GTA, ACC, CAG, GGG, TTA, GGC, AAA, AAT, CAG, GGG, CTG, TTT, TTT, CCG, CAC, GAC, CTG, CCG, GAA, TTC, AGC, CTG, ACT, GAA, ATT, GAT, GAG, ATG, CTG, AAG, CTG, GAT, TTT, GTC, ACC, CGC, AGT, GCG, AAG, ATC, CTC, TCG, GCG, TTT, ATT, GGT, GAT, GAA, ATC, CCG, CAG, GAA, ATC, CTG, GAA, GAG, CGC, GTA, CGT, GCG, GCG, TTT, GCC, TTC, CCG, GCT, CCG, GTC, GCC, AAT, GTT, GAA, AGC, GAT, GTC, GGT, TGT, CTG, GAA, TTG, TTC, CAC, GGG, CCA, ACG, CTG, GCA, TTT, AAA, GAT, TTC, GGC, GGT, CGC, TTT, ATG, GCA, CAA, ATG, CTG, ACC, CAT, ATT, GCG, GGC, GAT, AAG, CCA, GTG, ACC, ATT, CTG, ACC, GCG, ACA, TCC, GGT, GAT, ACT, GGA, GCG, GCA, GTG, GCT, CAT, GCT, TTC, TAC, GGT, TTA, CCG, AAT, GTG, AAA, GTG, GTT, ATC, CTC, TAT, CCA, CGA, GGC, AAA, ATC, AGT, CCA, CTG, CAA, GAA, AAA, CTG, TTC, TGT, ACA, TTG, GGC, GGC, AAT, ATC, GAA, ACT, GTT, GCC, ATC, GAC, GGC, GAT, TTC, GAT, GCC, TGT, CAG, GCG, CTG, GTG, AAG, CAG, GCG, TTT, GAT, GAT, GAA, GAA, CTG, AAA, GTG, GCG, CTG, GGG, CTG, AAT, TCT, GCT, AAC, TCC, ATC, AAC, ATC, AGT, CGC, TTG, CTG, GCG, CAG, ATT, TGT, TAT, TAC, TTT, GAG, GCT, GTC, GCA, CAG, TTG, CCG, CAA, GAA, GCA, CGT, AAC, CAG, TTG, GTT, GTC, TCG, GTA, CCG, AGT, GGA, AAC, TTC, GGC, GAT, TTG, ACG, GCG, GGT, CTG, CTG, GCG, AAG, TCA, CTC, GGT, CTG, CCG, GTA, AAA, CGT, TTT, ATT, GCT, GCG, ACC, AAC, GTG, AAC, GAT, ACC, GTA, CCA, CGT, TTC, CTG, CAC, GAC, GGT, CAG, TGG, TCA, CCC, AAA, GCG, ACT, CAG, GCG, ACG, TTA, TCC, AAT, GCG, ATG, GAT, GTT, AGC, CAG, CCA, AAC, AAC, TGG, CCG, CGT, GTG, GAA, GAG, TTG, TTC, CGC, CGC, AAA, ATC, TGG, CAA, CTG, AAA, GAG, CTG, GGT, TAT, GCA, GCC, GTG, GAT, GAT, GAA, ACC, ACG, CAA, CAG, ACA, ATG, CGT, GAG, TTA, AAA, GAA, CTG, GGC, TAT, ACC, TCG, GAG, CCG, CAC, GCT, GCC, GTA, GCT, TAT, CGT, GCG, CTG, CGT, GAC, CAG, TTG, AAT, CCA, GGC, GAA, TAT, GGC, TTG, TTC, CTC, GGC, ACC, GCG, CAT, CCG, GCG, AAA, TTT, AAA, GAG, AGC, GTG, GAA, GCG, ATT, CTC, GGT, GAA, ACG, TTG, GAT, CTG, CCA, 
AAA, GAG, CTG, GCA, GAA, CGT, GCT, GAT, TTA, CCC, TTG, CTT, TCG, CAT, AAC, CTG, CCC, GCC, GAT, TTT, GCT, GCG, TTG, CGT, AAA, TTG, ATG, ATG, AAT, CAT, CAG, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: hypothetical protein
|
||||||
|
Nucleotides: ATGCAGCCCGGCTTTTTTTATGAAGAAAATATGGAGAAAAACGACAGGGAAAAAGGAGAAATTCTCAATAAATGCGGTAACTTAGAGATTAGGATTGCGGAGAATAACAACTGCCGTTCTCATCGCGTAATCTCCGGATATCGACCCATAACGGGCAATGATAAAAGGAGTAACCTGTGA
|
||||||
|
Nuc. Counts: [66, 31, 43, 40]
|
||||||
|
Total Mass%: [37.4, 14.4, 27.2, 21.0] of 23865.4
|
||||||
|
Codons List: [ATG, CAG, CCC, GGC, TTT, TTT, TAT, GAA, GAA, AAT, ATG, GAG, AAA, AAC, GAC, AGG, GAA, AAA, GGA, GAA, ATT, CTC, AAT, AAA, TGC, GGT, AAC, TTA, GAG, ATT, AGG, ATT, GCG, GAG, AAT, AAC, AAC, TGC, CGT, TCT, CAT, CGC, GTA, ATC, TCC, GGA, TAT, CGA, CCC, ATA, ACG, GGC, AAT, GAT, AAA, AGG, AGT, AAC, CTG, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: Non-protein region
|
||||||
|
Nucleotides: AAAAACTGCTGGAAACAATGAAAGACGTACCGGACGACCAACGTCAGGCGC
|
||||||
|
Nuc. Counts: [20, 13, 13, 5]
|
||||||
|
Total Mass%: [40.1, 21.4, 29.2, 9.3] of 6737.1
|
||||||
|
Codons List: [AAA, AAC, TGC, TGG, AAA, CAA, TGA, AAG, ACG, TAC, CGG, ACG, ACC, AAC, GTC, AGG, CGC]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: transaldolase B
|
||||||
|
Nucleotides: ATGACGGACAAATTGACCTCCCTTCGTCAGTACACCACCGTAGTGGCCGACACTGGGGACATCGCGGCAATGAAGCTGTATCAACCGCAGGATGCCACAACCAACCCTTCTCTCATTCTTAACGCAGCGCAGATTCCGGAATACCGTAAGTTGATTGATGATGCTGTCGCCTGGGCGAAACAGCAGAGCAACGATCGCGCGCAGCAGATCGTGGACGCGACCGACAAACTGGCAGTAAATATTGGTCTGGAAATCCTGAAACTGGTTCCGGGCCGTATCTCAACTGAAGTTGATGCGCGTCTTTCCTATGACACCGAAGCGTCAATTGCGAAAGCAAAACGCCTGATCAAACTCTACAACGATGCAGGTATTAGCAACGATCGTATTCTGATCAAACTGGCTTCTACCTGGCAGGGTATCCGTGCTGCAGAACAGCTGGAAAAAGAAGGTATTAACTGTAACCTGACCCTGCTGTTCTCCTTCGCTCAGGCTCGTGCTTGTGCGGAAGCGGGCGTGTTCCTGATCTCGCCGTTTGTTGGCCGTATTCTTGACTGGTACAAAGCGAATACCGATAAGAAAGAGTACGCTCCGGCAGAAGATCCGGGCGTGGTTTCTGTATCTGAAATCTACCAGTACTACAAAGAGCATGGTTATGAAACCGTGGTTATGGGCGCAAGCTTCCGTAACATCGGCGAAATTCTGGAACTGGCAGGCTGCGACCGTCTGACCATCGCACCGGCACTGCTGAAAGAGCTGGCGGAGAGCGAAGGGGCTATCGAACGTAAACTGTCTTACACTGGTGAAGTGAAAGCGCGTCCGGCGCGTATCACTGAGTCCGAGTTCCTGTGGCAGCACAACCAGGATCCAATGGCAGTAGATAAACTGGCGGAAGGTATCCGTAAGTTTGCTGTTGACCAGGAAAAACTGGAAAAAATGATCGGCGATCTGCTGTAA
|
||||||
|
Nuc. Counts: [252, 236, 256, 210]
|
||||||
|
Total Mass%: [27.2, 20.9, 30.9, 21.0] of 125233.8
|
||||||
|
Codons List: [ATG, ACG, GAC, AAA, TTG, ACC, TCC, CTT, CGT, CAG, TAC, ACC, ACC, GTA, GTG, GCC, GAC, ACT, GGG, GAC, ATC, GCG, GCA, ATG, AAG, CTG, TAT, CAA, CCG, CAG, GAT, GCC, ACA, ACC, AAC, CCT, TCT, CTC, ATT, CTT, AAC, GCA, GCG, CAG, ATT, CCG, GAA, TAC, CGT, AAG, TTG, ATT, GAT, GAT, GCT, GTC, GCC, TGG, GCG, AAA, CAG, CAG, AGC, AAC, GAT, CGC, GCG, CAG, CAG, ATC, GTG, GAC, GCG, ACC, GAC, AAA, CTG, GCA, GTA, AAT, ATT, GGT, CTG, GAA, ATC, CTG, AAA, CTG, GTT, CCG, GGC, CGT, ATC, TCA, ACT, GAA, GTT, GAT, GCG, CGT, CTT, TCC, TAT, GAC, ACC, GAA, GCG, TCA, ATT, GCG, AAA, GCA, AAA, CGC, CTG, ATC, AAA, CTC, TAC, AAC, GAT, GCA, GGT, ATT, AGC, AAC, GAT, CGT, ATT, CTG, ATC, AAA, CTG, GCT, TCT, ACC, TGG, CAG, GGT, ATC, CGT, GCT, GCA, GAA, CAG, CTG, GAA, AAA, GAA, GGT, ATT, AAC, TGT, AAC, CTG, ACC, CTG, CTG, TTC, TCC, TTC, GCT, CAG, GCT, CGT, GCT, TGT, GCG, GAA, GCG, GGC, GTG, TTC, CTG, ATC, TCG, CCG, TTT, GTT, GGC, CGT, ATT, CTT, GAC, TGG, TAC, AAA, GCG, AAT, ACC, GAT, AAG, AAA, GAG, TAC, GCT, CCG, GCA, GAA, GAT, CCG, GGC, GTG, GTT, TCT, GTA, TCT, GAA, ATC, TAC, CAG, TAC, TAC, AAA, GAG, CAT, GGT, TAT, GAA, ACC, GTG, GTT, ATG, GGC, GCA, AGC, TTC, CGT, AAC, ATC, GGC, GAA, ATT, CTG, GAA, CTG, GCA, GGC, TGC, GAC, CGT, CTG, ACC, ATC, GCA, CCG, GCA, CTG, CTG, AAA, GAG, CTG, GCG, GAG, AGC, GAA, GGG, GCT, ATC, GAA, CGT, AAA, CTG, TCT, TAC, ACT, GGT, GAA, GTG, AAA, GCG, CGT, CCG, GCG, CGT, ATC, ACT, GAG, TCC, GAG, TTC, CTG, TGG, CAG, CAC, AAC, CAG, GAT, CCA, ATG, GCA, GTA, GAT, AAA, CTG, GCG, GAA, GGT, ATC, CGT, AAG, TTT, GCT, GTT, GAC, CAG, GAA, AAA, CTG, GAA, AAA, ATG, ATC, GGC, GAT, CTG, CTG, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: molybdopterin biosynthesis mog protein
|
||||||
|
Nucleotides: ATGAATACTTTACGTATTGGCTTAGTTTCCATCTCTGATCGCGCATCCAGCGGCGTTTATCAGGATAAAGGCATCCCTGCGCTGGAAGAATGGCTGACATCGGCGCTAACCACGCCGTTTGAACTGGAAACCCGCTTAATCCCCGATGAGCAGGCGATCATCGAGCAAACGTTGTGTGAGCTGGTGGATGAAATGAGTTGCCATCTGGTGCTCACCACGGGCGGAACTGGCCCTGCGCGTCGTGACGTAACGCCCGATGCGACGCTGGCAGTAGCGGACCGCGAGATGCCAGGCTTTGGTGAACAGATGCGCCAGATCAGCCTGCATTTTGTACCAACTGCGATCCTTTCGCGTCAGGTGGGGGTGATTCGCAAACAGGCGCTGATCCTTAACTTACCCGGTCAACCGAAGTCTATTAAAGAGACGCTGGAAGGTGTGAAGGACGCTGAGGGTAACGTTGTGGTGCACGGTATTTTTGCCAGCGTACCGTACTGCATTCAGTTGCTGGAAGGGCCATACGTTGAAACGGCACCGGAAGTGGTTGCAGCATTCAGACCGAAGAGTGCAAGACGCGAAGTTAGCGAATAA
|
||||||
|
Nuc. Counts: [139, 143, 175, 131]
|
||||||
|
Total Mass%: [24.2, 20.5, 34.1, 21.1] of 77506.9
|
||||||
|
Codons List: [ATG, AAT, ACT, TTA, CGT, ATT, GGC, TTA, GTT, TCC, ATC, TCT, GAT, CGC, GCA, TCC, AGC, GGC, GTT, TAT, CAG, GAT, AAA, GGC, ATC, CCT, GCG, CTG, GAA, GAA, TGG, CTG, ACA, TCG, GCG, CTA, ACC, ACG, CCG, TTT, GAA, CTG, GAA, ACC, CGC, TTA, ATC, CCC, GAT, GAG, CAG, GCG, ATC, ATC, GAG, CAA, ACG, TTG, TGT, GAG, CTG, GTG, GAT, GAA, ATG, AGT, TGC, CAT, CTG, GTG, CTC, ACC, ACG, GGC, GGA, ACT, GGC, CCT, GCG, CGT, CGT, GAC, GTA, ACG, CCC, GAT, GCG, ACG, CTG, GCA, GTA, GCG, GAC, CGC, GAG, ATG, CCA, GGC, TTT, GGT, GAA, CAG, ATG, CGC, CAG, ATC, AGC, CTG, CAT, TTT, GTA, CCA, ACT, GCG, ATC, CTT, TCG, CGT, CAG, GTG, GGG, GTG, ATT, CGC, AAA, CAG, GCG, CTG, ATC, CTT, AAC, TTA, CCC, GGT, CAA, CCG, AAG, TCT, ATT, AAA, GAG, ACG, CTG, GAA, GGT, GTG, AAG, GAC, GCT, GAG, GGT, AAC, GTT, GTG, GTG, CAC, GGT, ATT, TTT, GCC, AGC, GTA, CCG, TAC, TGC, ATT, CAG, TTG, CTG, GAA, GGG, CCA, TAC, GTT, GAA, ACG, GCA, CCG, GAA, GTG, GTT, GCA, GCA, TTC, AGA, CCG, AAG, AGT, GCA, AGA, CGC, GAA, GTT, AGC, GAA, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: chaperone protein DnaK
|
||||||
|
Nucleotides: ATGGGTAAAATAATTGGTATCGACCTGGGTACTACCAACTCTTGTGTAGCGATTATGGATGGCACCACTCCTCGTGTACTGGAGAACGCCGAAGGCGATCGCACCACGCCTTCTATCATTGCCTATACCCAGGATGGTGAAACTCTGGTTGGTCAGCCGGCTAAACGTCAGGCAGTGACGAACCCGCAAAACACCCTGTTTGCGATTAAACGCCTGATTGGCCGCCGCTTCCAGGACGAAGAAGTACAGCGTGATGTTTCCATCATGCCGTTCAAAATTATTGCTGCTGATAACGGCGACGCATGGGTCGAAGTTAAAGGCCAGAAAATGGCACCGCCGCAGATCTCTGCTGAAGTGCTGAAAAAAATGAAGAAAACCGCTGAAGATTACCTGGGTGAACCGGTAACTGAAGCTGTTATTACCGTACCGGCATACTTTAACGATGCTCAGCGTCAGGCAACCAAAGACGCAGGCCGTATCGCTGGTCTGGAAGTAAAACGTATCATCAACGAACCGACCGCAGCTGCGCTGGCTTACGGTCTGGACAAAGGTACTGGCAACCGTACTATCGCGGTTTATGACCTGGGTGGTGGTACTTTCGATATTTCCATTATCGAAATCGACGAAGTTGACGGCGAAAAAACCTTCGAAGTTCTGGCAACCAACGGTGATACCCACCTGGGTGGTGAAGACTTCGACAGTCGTCTGATCAACTATCTGGTTGAAGAATTCAAGAAAGATCAGGGCATTGACCTGCGCAACGATCCGCTGGCAATGCAGCGCCTGAAAGAAGCGGCAGAAAAAGCGAAAATCGAACTGTCTTCCGCTCAGCAGACCGACGTTAACCTGCCGTACATCACTGCAGACGCGACCGGTCCGAAACACATGAACATCAAAGTGACTCGTGCGAAACTGGAAAGCCTGGTTGAAGATCTGGTAAACCGTTCCATTGAGCCGCTGAAAGTTGCACTGCAGGACGCTGGCCTGTCCGTATCTGATATCGACGACGTTATTCTCGTTGGTGGTCAGACTCGTATGCCAATGGTTCAGAAGAAAGTTGCTGAATTCTTTGGTAAAGAGCCGCGTAAAGATGTTAACCCGGACGAAGCTGTAGCCATCGGTGCTGCTGTTCAGGGTGGTGTTCTGACTGGTGACGTAAAAGACGTACTGCTGCTGGACGTTACCCCGCTGTCTCTGGGTATCGAAACCATGGGCGGTGTGATGACCACGCTGATCGCGAAAAACACCACTATCCCGACCAAGCACAGCCAGGTGTTCTCTACCGCTGAAGACAACCAGTCTGCGGTAACCATCCATGTGCTGCAGGGTGAACGTAAACGTGCGGCTGATAACAAATCTCTGGGTCAGTTCAACCTGGATGGTATCAACCCGGCACCGCGCGGCATGCCGCAGATCGAAGTTACCTTCGATATCGATGCTGACGGTATCCTGCACGTTTCCGCGAAAGACAAAAACAGCGGTAAAGAGCAGAAGATCACTATCAAGGCTTCTTCTGGTCTGAACGAAGATGAAATCCAGAAAATGGTACGCGACGCAGAAGCTAACGCCGAAGCTGACCGTAAGTTTGAAGAGCTGGTACAGACTCGCAACCAGGGCGACCATCTGCTGCACAGCACCCGTAAGCAGGTTGAAGAAGCAGGCGACAAACTGCCGGCTGACGACAAAACTGCTATCGAGTCTGCGCTGACTGCACTGGAAACTGCTCTGAAAGGTGAAGACAAAGCCGCTATCGAAGCGAAAATGCAGGAACTGGCACAGGTTTCCCAGAAACTGATGGAAATCGCCCAGCAGCAACATGCCCAGCAGCAGACTGCCGGTGCTGATGCTTCTGCAAACAACGCGAAAGATGACGATGTTGTCGACGCTGAATTTGAAGAAGTCAAAGACAAAAAATAA
|
||||||
|
Nuc. Counts: [541, 475, 504, 397]
|
||||||
|
Total Mass%: [29.0, 21.0, 30.3, 19.7] of 251714.2
|
||||||
|
Codons List: [ATG, GGT, AAA, ATA, ATT, GGT, ATC, GAC, CTG, GGT, ACT, ACC, AAC, TCT, TGT, GTA, GCG, ATT, ATG, GAT, GGC, ACC, ACT, CCT, CGT, GTA, CTG, GAG, AAC, GCC, GAA, GGC, GAT, CGC, ACC, ACG, CCT, TCT, ATC, ATT, GCC, TAT, ACC, CAG, GAT, GGT, GAA, ACT, CTG, GTT, GGT, CAG, CCG, GCT, AAA, CGT, CAG, GCA, GTG, ACG, AAC, CCG, CAA, AAC, ACC, CTG, TTT, GCG, ATT, AAA, CGC, CTG, ATT, GGC, CGC, CGC, TTC, CAG, GAC, GAA, GAA, GTA, CAG, CGT, GAT, GTT, TCC, ATC, ATG, CCG, TTC, AAA, ATT, ATT, GCT, GCT, GAT, AAC, GGC, GAC, GCA, TGG, GTC, GAA, GTT, AAA, GGC, CAG, AAA, ATG, GCA, CCG, CCG, CAG, ATC, TCT, GCT, GAA, GTG, CTG, AAA, AAA, ATG, AAG, AAA, ACC, GCT, GAA, GAT, TAC, CTG, GGT, GAA, CCG, GTA, ACT, GAA, GCT, GTT, ATT, ACC, GTA, CCG, GCA, TAC, TTT, AAC, GAT, GCT, CAG, CGT, CAG, GCA, ACC, AAA, GAC, GCA, GGC, CGT, ATC, GCT, GGT, CTG, GAA, GTA, AAA, CGT, ATC, ATC, AAC, GAA, CCG, ACC, GCA, GCT, GCG, CTG, GCT, TAC, GGT, CTG, GAC, AAA, GGT, ACT, GGC, AAC, CGT, ACT, ATC, GCG, GTT, TAT, GAC, CTG, GGT, GGT, GGT, ACT, TTC, GAT, ATT, TCC, ATT, ATC, GAA, ATC, GAC, GAA, GTT, GAC, GGC, GAA, AAA, ACC, TTC, GAA, GTT, CTG, GCA, ACC, AAC, GGT, GAT, ACC, CAC, CTG, GGT, GGT, GAA, GAC, TTC, GAC, AGT, CGT, CTG, ATC, AAC, TAT, CTG, GTT, GAA, GAA, TTC, AAG, AAA, GAT, CAG, GGC, ATT, GAC, CTG, CGC, AAC, GAT, CCG, CTG, GCA, ATG, CAG, CGC, CTG, AAA, GAA, GCG, GCA, GAA, AAA, GCG, AAA, ATC, GAA, CTG, TCT, TCC, GCT, CAG, CAG, ACC, GAC, GTT, AAC, CTG, CCG, TAC, ATC, ACT, GCA, GAC, GCG, ACC, GGT, CCG, AAA, CAC, ATG, AAC, ATC, AAA, GTG, ACT, CGT, GCG, AAA, CTG, GAA, AGC, CTG, GTT, GAA, GAT, CTG, GTA, AAC, CGT, TCC, ATT, GAG, CCG, CTG, AAA, GTT, GCA, CTG, CAG, GAC, GCT, GGC, CTG, TCC, GTA, TCT, GAT, ATC, GAC, GAC, GTT, ATT, CTC, GTT, GGT, GGT, CAG, ACT, CGT, ATG, CCA, ATG, GTT, CAG, AAG, AAA, GTT, GCT, GAA, TTC, TTT, GGT, AAA, GAG, CCG, CGT, AAA, GAT, GTT, AAC, CCG, GAC, GAA, GCT, GTA, GCC, ATC, GGT, GCT, GCT, GTT, CAG, GGT, GGT, GTT, CTG, ACT, GGT, GAC, GTA, AAA, GAC, GTA, CTG, CTG, CTG, GAC, GTT, ACC, CCG, CTG, 
TCT, CTG, GGT, ATC, GAA, ACC, ATG, GGC, GGT, GTG, ATG, ACC, ACG, CTG, ATC, GCG, AAA, AAC, ACC, ACT, ATC, CCG, ACC, AAG, CAC, AGC, CAG, GTG, TTC, TCT, ACC, GCT, GAA, GAC, AAC, CAG, TCT, GCG, GTA, ACC, ATC, CAT, GTG, CTG, CAG, GGT, GAA, CGT, AAA, CGT, GCG, GCT, GAT, AAC, AAA, TCT, CTG, GGT, CAG, TTC, AAC, CTG, GAT, GGT, ATC, AAC, CCG, GCA, CCG, CGC, GGC, ATG, CCG, CAG, ATC, GAA, GTT, ACC, TTC, GAT, ATC, GAT, GCT, GAC, GGT, ATC, CTG, CAC, GTT, TCC, GCG, AAA, GAC, AAA, AAC, AGC, GGT, AAA, GAG, CAG, AAG, ATC, ACT, ATC, AAG, GCT, TCT, TCT, GGT, CTG, AAC, GAA, GAT, GAA, ATC, CAG, AAA, ATG, GTA, CGC, GAC, GCA, GAA, GCT, AAC, GCC, GAA, GCT, GAC, CGT, AAG, TTT, GAA, GAG, CTG, GTA, CAG, ACT, CGC, AAC, CAG, GGC, GAC, CAT, CTG, CTG, CAC, AGC, ACC, CGT, AAG, CAG, GTT, GAA, GAA, GCA, GGC, GAC, AAA, CTG, CCG, GCT, GAC, GAC, AAA, ACT, GCT, ATC, GAG, TCT, GCG, CTG, ACT, GCA, CTG, GAA, ACT, GCT, CTG, AAA, GGT, GAA, GAC, AAA, GCC, GCT, ATC, GAA, GCG, AAA, ATG, CAG, GAA, CTG, GCA, CAG, GTT, TCC, CAG, AAA, CTG, ATG, GAA, ATC, GCC, CAG, CAG, CAA, CAT, GCC, CAG, CAG, CAG, ACT, GCC, GGT, GCT, GAT, GCT, TCT, GCA, AAC, AAC, GCG, AAA, GAT, GAC, GAT, GTT, GTC, GAC, GCT, GAA, TTT, GAA, GAA, GTC, AAA, GAC, AAA, AAA, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: chaperone protein DnaJ
|
||||||
|
Nucleotides: GTGCATTCATCTAGGGGCAATTTAAAAAAGATGGCTAAGCAAGATTATTACGAGATTTTAGGCGTTTCCAAAACAGCGGAAGAGCGTGAAATCAAAAAGGCCTACAAACGCCTGGCCATGAAATACCACCCGGACCGTAACCAGGGTGACAAAGAGGCCGAGGCGAAATTTAAAGAGATCAAGGAAGCTTATGAAGTTCTGACCGACTCGCAAAAACGTGCGGCATACGATCAGTATGGTCATGCTGCGTTTGAGCAAGGTGGCATGGGCGGCGGCGGTTTTGGCGGCGGCGCAGACTTCAGCGATATTTTTGGTGACGTTTTCGGCGATATTTTTGGCGGCGGACGTGGTCGTCAACGTGCGGCGCGCGGTGCTGATTTACGCTATAACATGGAGCTCACCCTCGAAGAAGCTGTACGTGGCGTGACCAAAGAGATCCGCATTCCGACTCTGGAAGAGTGTGACGTTTGCCACGGTAGCGGTGCAAAACCAGGTACACAGCCGCAGACCTGTCCGACCTGTCATGGTTCTGGCCAGGTGCAGATGCGCCAGGGTTTCTTTGCCGTGCAGCAGACCTGTCCACACTGTCAGGGCCGCGGTACGCTGATCAAAGATCCGTGCAACAAATGTCATGGTCATGGTCGTGTTGAGCGCAGCAAAACGCTGTCCGTTAAAATCCCGGCAGGGGTGGACACTGGAGACCGCATCCGTCTTGCGGGCGAAGGTGAAGCGGGTGAACACGGCGCACCGGCAGGCGATCTGTACGTTCAGGTTCAGGTTAAACAGCACCCGATTTTCGAGCGTGAAGGCAACAACCTGTATTGCGAAGTCCCGATCAACTTCGCTATGGCGGCGCTGGGTGGTGAAATCGAAGTACCGACCCTTGATGGTCGCGTCAAACTGAAAGTGCCTGGCGAAACCCAGACCGGTAAGCTGTTCCGTATGCGCGGTAAAGGCGTCAAGTCTGTCCGCGGTGGCGCACAGGGTGATTTGCTATGCCGCGTTGTTGTCGAAACACCGGTAGGTTTGAACGAGAAGCAGAAACAGCTGCTGCAAGAGCTGCAAGAAAGCTTTGGTGGCCCAACCGGCGAGCACAACAGCCCGCGTTCAAAGAGCTTCTTTGATGGCGTGAAGAAGTTTTTTGACGACCTGACTCGCTAA
|
||||||
|
Nuc. Counts: [287, 278, 352, 244]
|
||||||
|
Total Mass%: [25.3, 20.1, 34.7, 19.9] of 153391.5
|
||||||
|
Codons List: [GTG, CAT, TCA, TCT, AGG, GGC, AAT, TTA, AAA, AAG, ATG, GCT, AAG, CAA, GAT, TAT, TAC, GAG, ATT, TTA, GGC, GTT, TCC, AAA, ACA, GCG, GAA, GAG, CGT, GAA, ATC, AAA, AAG, GCC, TAC, AAA, CGC, CTG, GCC, ATG, AAA, TAC, CAC, CCG, GAC, CGT, AAC, CAG, GGT, GAC, AAA, GAG, GCC, GAG, GCG, AAA, TTT, AAA, GAG, ATC, AAG, GAA, GCT, TAT, GAA, GTT, CTG, ACC, GAC, TCG, CAA, AAA, CGT, GCG, GCA, TAC, GAT, CAG, TAT, GGT, CAT, GCT, GCG, TTT, GAG, CAA, GGT, GGC, ATG, GGC, GGC, GGC, GGT, TTT, GGC, GGC, GGC, GCA, GAC, TTC, AGC, GAT, ATT, TTT, GGT, GAC, GTT, TTC, GGC, GAT, ATT, TTT, GGC, GGC, GGA, CGT, GGT, CGT, CAA, CGT, GCG, GCG, CGC, GGT, GCT, GAT, TTA, CGC, TAT, AAC, ATG, GAG, CTC, ACC, CTC, GAA, GAA, GCT, GTA, CGT, GGC, GTG, ACC, AAA, GAG, ATC, CGC, ATT, CCG, ACT, CTG, GAA, GAG, TGT, GAC, GTT, TGC, CAC, GGT, AGC, GGT, GCA, AAA, CCA, GGT, ACA, CAG, CCG, CAG, ACC, TGT, CCG, ACC, TGT, CAT, GGT, TCT, GGC, CAG, GTG, CAG, ATG, CGC, CAG, GGT, TTC, TTT, GCC, GTG, CAG, CAG, ACC, TGT, CCA, CAC, TGT, CAG, GGC, CGC, GGT, ACG, CTG, ATC, AAA, GAT, CCG, TGC, AAC, AAA, TGT, CAT, GGT, CAT, GGT, CGT, GTT, GAG, CGC, AGC, AAA, ACG, CTG, TCC, GTT, AAA, ATC, CCG, GCA, GGG, GTG, GAC, ACT, GGA, GAC, CGC, ATC, CGT, CTT, GCG, GGC, GAA, GGT, GAA, GCG, GGT, GAA, CAC, GGC, GCA, CCG, GCA, GGC, GAT, CTG, TAC, GTT, CAG, GTT, CAG, GTT, AAA, CAG, CAC, CCG, ATT, TTC, GAG, CGT, GAA, GGC, AAC, AAC, CTG, TAT, TGC, GAA, GTC, CCG, ATC, AAC, TTC, GCT, ATG, GCG, GCG, CTG, GGT, GGT, GAA, ATC, GAA, GTA, CCG, ACC, CTT, GAT, GGT, CGC, GTC, AAA, CTG, AAA, GTG, CCT, GGC, GAA, ACC, CAG, ACC, GGT, AAG, CTG, TTC, CGT, ATG, CGC, GGT, AAA, GGC, GTC, AAG, TCT, GTC, CGC, GGT, GGC, GCA, CAG, GGT, GAT, TTG, CTA, TGC, CGC, GTT, GTT, GTC, GAA, ACA, CCG, GTA, GGT, TTG, AAC, GAG, AAG, CAG, AAA, CAG, CTG, CTG, CAA, GAG, CTG, CAA, GAA, AGC, TTT, GGT, GGC, CCA, ACC, GGC, GAG, CAC, AAC, AGC, CCG, CGT, TCA, AAG, AGC, TTC, TTT, GAT, GGC, GTG, AAG, AAG, TTT, TTT, GAC, GAC, CTG, ACT, CGC, TAA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: hypothetical protein
|
||||||
|
Nucleotides: TTGCTCTTACTCGGATTCGTAAGCCGTGAAAACAGCAACCTCCGTCTGGCCAGTTCGGATGTGAACCTCACAGAGGTCTTTTCTCGTTACCAGCGCCGCCACTACGGCGGTGATACAGATGACGATCAGGGCGACAATCATCGCCTTATGCTGCTTCATTGCTCTCTTCTCCTTGACCTTTCGGTCAGTAAGAGGCACTCTACATGTGTTCTGCATATAGGGGGCCTCGGGTTGATGGTAAAATATCACTCGGGGCTTTTCTCTATCTGCCGTTCAGCTAATGCCTGA
|
||||||
|
Nuc. Counts: [58, 78, 69, 83]
|
||||||
|
Total Mass%: [21.0, 23.2, 27.9, 27.8] of 37315.2
|
||||||
|
Codons List: [TTG, CTC, TTA, CTC, GGA, TTC, GTA, AGC, CGT, GAA, AAC, AGC, AAC, CTC, CGT, CTG, GCC, AGT, TCG, GAT, GTG, AAC, CTC, ACA, GAG, GTC, TTT, TCT, CGT, TAC, CAG, CGC, CGC, CAC, TAC, GGC, GGT, GAT, ACA, GAT, GAC, GAT, CAG, GGC, GAC, AAT, CAT, CGC, CTT, ATG, CTG, CTT, CAT, TGC, TCT, CTT, CTC, CTT, GAC, CTT, TCG, GTC, AGT, AAG, AGG, CAC, TCT, ACA, TGT, GTT, CTG, CAT, ATA, GGG, GGC, CTC, GGG, TTG, ATG, GTA, AAA, TAT, CAC, TCG, GGG, CTT, TTC, TCT, ATC, TGC, CGT, TCA, GCT, AAT, GCC, TGA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: hypothetical protein
|
||||||
|
Nucleotides: ATGTCTGCCAAAAGACGACTTCTTATTGCGTGTACCTTGATAACAGCTATCTATCATTTTCCTGCATATTCTTCATTAGAATATAAAGGATCCTTTGGTTCAATAAATGCGGGTTATGCAGACTGGAATAGTGGATTTGTAAACACTCACCGTGGTGAAGTATGGAAAGTGACTGCGGATTTTGGGGTAAATTTTAAAGAAGCAGAATTTTACTCATTTTATGAAAGTAATGTACTCAATCATGCTGTAGCAGGGAGAAATCATACGGTTTCAGCAATGACGCATGTCAGACTCTTTGACTCTGATATGACATTCTTTGGCAAAATTTATGGCCAATGGGATAACTCATGGGGTGACGATCTGGACATGTTTTATGGATTCGGTTACCTCGGCTGGAACGGCGAGTGGGGCTTTTTTAAACCGTATATTGGATTGCATAATCAATCTGGTGACTACGTATCAGCTAAATATGGTCAAACGAATGGTTGGAATGGTTATGTTGTTGGCTGGACAGCAGTATTACCATTTACGTTATTTGACGAAAAATTTGTTTTATCTAACTGGAATGAAATAGAACTGGACAGGAACGATGCTTACACGGAGCAGCAATTTGGCCGGAACGGGTTAAATGGCGGTTTAACTATTGCCTGGAAGTTCTATCCTCGCTGGAAAGCCAGTGTGACGTGGCGTTATTTCGATAATAAGCTGGGCTACGATGGCTTTGGCGATCAAATGATTTATATGCTTGGTTATGATTTCTAA
|
||||||
|
Nuc. Counts: [214, 121, 184, 243]
|
||||||
|
Total Mass%: [28.8, 13.4, 27.7, 30.2] of 100569.4
|
||||||
|
Codons List: [ATG, TCT, GCC, AAA, AGA, CGA, CTT, CTT, ATT, GCG, TGT, ACC, TTG, ATA, ACA, GCT, ATC, TAT, CAT, TTT, CCT, GCA, TAT, TCT, TCA, TTA, GAA, TAT, AAA, GGA, TCC, TTT, GGT, TCA, ATA, AAT, GCG, GGT, TAT, GCA, GAC, TGG, AAT, AGT, GGA, TTT, GTA, AAC, ACT, CAC, CGT, GGT, GAA, GTA, TGG, AAA, GTG, ACT, GCG, GAT, TTT, GGG, GTA, AAT, TTT, AAA, GAA, GCA, GAA, TTT, TAC, TCA, TTT, TAT, GAA, AGT, AAT, GTA, CTC, AAT, CAT, GCT, GTA, GCA, GGG, AGA, AAT, CAT, ACG, GTT, TCA, GCA, ATG, ACG, CAT, GTC, AGA, CTC, TTT, GAC, TCT, GAT, ATG, ACA, TTC, TTT, GGC, AAA, ATT, TAT, GGC, CAA, TGG, GAT, AAC, TCA, TGG, GGT, GAC, GAT, CTG, GAC, ATG, TTT, TAT, GGA, TTC, GGT, TAC, CTC, GGC, TGG, AAC, GGC, GAG, TGG, GGC, TTT, TTT, AAA, CCG, TAT, ATT, GGA, TTG, CAT, AAT, CAA, TCT, GGT, GAC, TAC, GTA, TCA, GCT, AAA, TAT, GGT, CAA, ACG, AAT, GGT, TGG, AAT, GGT, TAT, GTT, GTT, GGC, TGG, ACA, GCA, GTA, TTA, CCA, TTT, ACG, TTA, TTT, GAC, GAA, AAA, TTT, GTT, TTA, TCT, AAC, TGG, AAT, GAA, ATA, GAA, CTG, GAC, AGG, AAC, GAT, GCT, TAC, ACG, GAG, CAG, CAA, TTT, GGC, CGG, AAC, GGG, TTA, AAT, GGC, GGT, TTA, ACT, ATT, GCC, TGG, AAG, TTC, TAT, CCT, CGC, TGG, AAA, GCC, AGT, GTG, ACG, TGG, CGT, TAT, TTC, GAT, AAT, AAG, CTG, GGC, TAC, GAT, GGC, TTT, GGC, GAT, CAA, ATG, ATT, TAT, ATG, CTT, GGT, TAT, GAT, TTC, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: putative secreted sulfatase
|
||||||
|
Nucleotides: ATGCAGAAAACGTTAATGGCCAGTTTGATCGGCCTTGCAGTTTGCACAGGGAATGCTTTTAGTCCTGCCTTAGCCGCAGAGGCTAAACAACCTAATTTAGTCATTATTATGGCGGATGATTTAGGTTATGGCGATTTAGCAACATATGGTCATCAGATCGTTAAAACACCTAATATCGACAGGCTTGCCCAGGAAGGGGTCAAATTTACTGACTACTATGCCCCCGCTCCTTTAAGTTCACCTTCACGCGCAGGGCTATTAACCGGCCGGATGCCATTTCGTACTGGAATTCGCTCATGGATTCCTTCAGGCAAAGATGTTGCCTTAGGGCGTAACGAACTCACGATTGCTAATCTACTCAAAGCGCAAGGGTACGACACGGCAATGATGGGTAAGCTGCATCTGAATGCAGGCGGCGATCGCACCGATCAGCCACAAGCACAAGATATGGGCTTTGATTACTCACTGGTTAATACGGCGGGCTTTGTTACCGACGCCACGCTGGATAACGCTAAAGAACGCCCGCGTTATGGCATGGTTTACCCGACAGGCTGGCTACGTAACGGGCAACCCACTCCACGAGCTGATAAAATGAGCGGTGAGTATGTCAGTTCGGAAGTCGTCAACTGGCTGGATAACAAAAAGGACAGCAAGCCTTTCTTCCTCTATGTTGCTTTTACCGAAGTGCATAGCCCCCTGGCTTCGCCCAAAAAATACCTCGATATGTACTCACAATATATGAGCGCGTATCAGAAGCAGCATCCTGATTTATTTTATGGCGACTGGGCAGACAAACCCTGGCGTGGTGTGGGGGAATATTATGCCAATATCAGCTATCTGGATGCACAGGTTGGAAAAGTGCTGGATAAAATCAAAGCTGTGGGTGAAGAAGATAACACAATCGTTATTTTTACCAGTGATAACGGTCCGGTAACGCGTGAAGCGCGCAAAGTGTATGAGCTGAATTTGGCAGGGGAAACGGATGGATTACGCGGTCGCAAGGATAACCTTTGGGAAGGCGGAATTCGTGTTCCAGCCATTATTAAATATGGTAAACATCTACCACAGGGAATGGTTTCAGATACACCCGTTTATGGTCTGGACTGGATGCCTACTTTAGCGAAAATGATGAACTTCAAATTACCTACAGACCGTACTTTCGATGGTGAATCGCTGGTTCCTGTTCTTGAGCAAAAAGCATTGAAACGCGAAAAGCCATTAATTTTCGGGATTGATATGCCATTCCAGGATGATCCAACCGATGAATGGGCGATCCGTGATGGTGACTGGAAGATGATTATCGATCGCAATAATAAACCGAAATATCTCTACAATCTGAAATCTGATCGTTATGAAACACTTAATCTGATCGGTAAAAAAACAGATATTGAAAAACAGATGTATGGTAAGTTTTTAAAATATAAAACTGATATTGATAATGATTCTCTAATGAAAGCCAGAGGTGATAAACCAGAAGCGGTGACCTGGGGCTAA
|
||||||
|
Nuc. Counts: [440, 312, 362, 380]
|
||||||
|
Total Mass%: [30.3, 17.7, 27.9, 24.2] of 196369.5
|
||||||
|
Codons List: [ATG, CAG, AAA, ACG, TTA, ATG, GCC, AGT, TTG, ATC, GGC, CTT, GCA, GTT, TGC, ACA, GGG, AAT, GCT, TTT, AGT, CCT, GCC, TTA, GCC, GCA, GAG, GCT, AAA, CAA, CCT, AAT, TTA, GTC, ATT, ATT, ATG, GCG, GAT, GAT, TTA, GGT, TAT, GGC, GAT, TTA, GCA, ACA, TAT, GGT, CAT, CAG, ATC, GTT, AAA, ACA, CCT, AAT, ATC, GAC, AGG, CTT, GCC, CAG, GAA, GGG, GTC, AAA, TTT, ACT, GAC, TAC, TAT, GCC, CCC, GCT, CCT, TTA, AGT, TCA, CCT, TCA, CGC, GCA, GGG, CTA, TTA, ACC, GGC, CGG, ATG, CCA, TTT, CGT, ACT, GGA, ATT, CGC, TCA, TGG, ATT, CCT, TCA, GGC, AAA, GAT, GTT, GCC, TTA, GGG, CGT, AAC, GAA, CTC, ACG, ATT, GCT, AAT, CTA, CTC, AAA, GCG, CAA, GGG, TAC, GAC, ACG, GCA, ATG, ATG, GGT, AAG, CTG, CAT, CTG, AAT, GCA, GGC, GGC, GAT, CGC, ACC, GAT, CAG, CCA, CAA, GCA, CAA, GAT, ATG, GGC, TTT, GAT, TAC, TCA, CTG, GTT, AAT, ACG, GCG, GGC, TTT, GTT, ACC, GAC, GCC, ACG, CTG, GAT, AAC, GCT, AAA, GAA, CGC, CCG, CGT, TAT, GGC, ATG, GTT, TAC, CCG, ACA, GGC, TGG, CTA, CGT, AAC, GGG, CAA, CCC, ACT, CCA, CGA, GCT, GAT, AAA, ATG, AGC, GGT, GAG, TAT, GTC, AGT, TCG, GAA, GTC, GTC, AAC, TGG, CTG, GAT, AAC, AAA, AAG, GAC, AGC, AAG, CCT, TTC, TTC, CTC, TAT, GTT, GCT, TTT, ACC, GAA, GTG, CAT, AGC, CCC, CTG, GCT, TCG, CCC, AAA, AAA, TAC, CTC, GAT, ATG, TAC, TCA, CAA, TAT, ATG, AGC, GCG, TAT, CAG, AAG, CAG, CAT, CCT, GAT, TTA, TTT, TAT, GGC, GAC, TGG, GCA, GAC, AAA, CCC, TGG, CGT, GGT, GTG, GGG, GAA, TAT, TAT, GCC, AAT, ATC, AGC, TAT, CTG, GAT, GCA, CAG, GTT, GGA, AAA, GTG, CTG, GAT, AAA, ATC, AAA, GCT, GTG, GGT, GAA, GAA, GAT, AAC, ACA, ATC, GTT, ATT, TTT, ACC, AGT, GAT, AAC, GGT, CCG, GTA, ACG, CGT, GAA, GCG, CGC, AAA, GTG, TAT, GAG, CTG, AAT, TTG, GCA, GGG, GAA, ACG, GAT, GGA, TTA, CGC, GGT, CGC, AAG, GAT, AAC, CTT, TGG, GAA, GGC, GGA, ATT, CGT, GTT, CCA, GCC, ATT, ATT, AAA, TAT, GGT, AAA, CAT, CTA, CCA, CAG, GGA, ATG, GTT, TCA, GAT, ACA, CCC, GTT, TAT, GGT, CTG, GAC, TGG, ATG, CCT, ACT, TTA, GCG, AAA, ATG, ATG, AAC, TTC, AAA, TTA, CCT, ACA, GAC, CGT, ACT, TTC, GAT, GGT, GAA, TCG, CTG, GTT, CCT, GTT, CTT, GAG, 
CAA, AAA, GCA, TTG, AAA, CGC, GAA, AAG, CCA, TTA, ATT, TTC, GGG, ATT, GAT, ATG, CCA, TTC, CAG, GAT, GAT, CCA, ACC, GAT, GAA, TGG, GCG, ATC, CGT, GAT, GGT, GAC, TGG, AAG, ATG, ATT, ATC, GAT, CGC, AAT, AAT, AAA, CCG, AAA, TAT, CTC, TAC, AAT, CTG, AAA, TCT, GAT, CGT, TAT, GAA, ACA, CTT, AAT, CTG, ATC, GGT, AAA, AAA, ACA, GAT, ATT, GAA, AAA, CAG, ATG, TAT, GGT, AAG, TTT, TTA, AAA, TAT, AAA, ACT, GAT, ATT, GAT, AAT, GAT, TCT, CTA, ATG, AAA, GCC, AGA, GGT, GAT, AAA, CCA, GAA, GCG, GTG, ACC, TGG, GGC, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: putative cytoplasmic protein
|
||||||
|
Nucleotides: ATGTTTACCAACGTAAATGTTGATTGTTGCAAAACACCAGGATGTAAAAACCTGGGGTTGCTGAATAGCCAGGATTATGTCGCACAGGGTAAAAATATTTTATGCCGTGAATGTGGTTACTTGTTTCCAGTGATATCTGAACAGTCGCTTAATATTTATCGTAATATTGTGAATCACTCCTGGAGAGGTTTGATTTGCCAATGTTCAACTTGCGGAGGCACGTCCCTCAAAAAATATGGATATTCTGCACAAGGCCAGAGAAGAATGTATTGCCATCATTGTGAGAAAACATTTATCACTCTGGAACATGTAATTACCACACCACGAGGAGCCCTGTTAGCATTGATGATTGAGCAAGGGGAGGCACTTGCGGATATCAGAAAGTCATTACGTCTTAACAGCACTGGACTTAGCCGTGAACTGTTAAAATTAGCGCGTGAAGCAAACTATAAAGAAAGTCGACAGTGTTTCCCTGCTTCTGATATTACCCTGAGTACCCGCGCTTTTCGCGTCAAGTATAATGGTAGCAATAACTCTCTTTATGCTCTTGTTACCGCAGAAGAACAAAGCGGCAGGGTGGTTGCCATCTCAACCAATTACTCCCCATCTGCCGTAGAGCAACATTATCAATACACATCGAACTATGAAGAGCGTATGTCTCCAGGGACGCTGGCACATCATGTCCAGCGCAAAGAGTTACTTACTATGCGGCGGGATACCTTGTTTGATATTGATTACGGCCCGGCAGTTTTACATCAAAACGATCCGGGAATGTTGGTAAAACCGGTTCTTCCGGCATATCGTCATTTTGAACTGGTCAGAATACTGACCGATGAGCATTCCAACAACGTTCAGCATTACCTTGATCACGAATGCTTTATATTGGGCGGCTGCCTGATGGCTAATTTGCAGCATATTCATCAAGGTCGCTGCCATATTTCCTTTGTCAAAGAGCGCGGTGTGGCACCCGCCACCATTGATTTTCCACCGCGATTATTCCTTAGTGGTGGGGTACGAAATAATGTCTGGCGTGCATTTTCTAACCGCAATTATTCAATGGCTGTATGCAATCTCACTGGCAGTAAGAAAGTCCGCGAGATGCGGCATGCAACATTGAACAGTGCGACGCGTTTTATCCACTTTGTGGAGAACCATCCTTTCCTTATATCATTGAACCGAATGTCTCCTGCGAATGTCGTTTCTACATTAGATATCCTCAAACATCTGTGGAATAAAAAACTAGAGCATGGAACAATTTAA
|
||||||
|
Nuc. Counts: [355, 273, 276, 356]
|
||||||
|
Total Mass%: [29.2, 18.4, 25.3, 27.1] of 164551.0
|
||||||
|
Codons List: [ATG, TTT, ACC, AAC, GTA, AAT, GTT, GAT, TGT, TGC, AAA, ACA, CCA, GGA, TGT, AAA, AAC, CTG, GGG, TTG, CTG, AAT, AGC, CAG, GAT, TAT, GTC, GCA, CAG, GGT, AAA, AAT, ATT, TTA, TGC, CGT, GAA, TGT, GGT, TAC, TTG, TTT, CCA, GTG, ATA, TCT, GAA, CAG, TCG, CTT, AAT, ATT, TAT, CGT, AAT, ATT, GTG, AAT, CAC, TCC, TGG, AGA, GGT, TTG, ATT, TGC, CAA, TGT, TCA, ACT, TGC, GGA, GGC, ACG, TCC, CTC, AAA, AAA, TAT, GGA, TAT, TCT, GCA, CAA, GGC, CAG, AGA, AGA, ATG, TAT, TGC, CAT, CAT, TGT, GAG, AAA, ACA, TTT, ATC, ACT, CTG, GAA, CAT, GTA, ATT, ACC, ACA, CCA, CGA, GGA, GCC, CTG, TTA, GCA, TTG, ATG, ATT, GAG, CAA, GGG, GAG, GCA, CTT, GCG, GAT, ATC, AGA, AAG, TCA, TTA, CGT, CTT, AAC, AGC, ACT, GGA, CTT, AGC, CGT, GAA, CTG, TTA, AAA, TTA, GCG, CGT, GAA, GCA, AAC, TAT, AAA, GAA, AGT, CGA, CAG, TGT, TTC, CCT, GCT, TCT, GAT, ATT, ACC, CTG, AGT, ACC, CGC, GCT, TTT, CGC, GTC, AAG, TAT, AAT, GGT, AGC, AAT, AAC, TCT, CTT, TAT, GCT, CTT, GTT, ACC, GCA, GAA, GAA, CAA, AGC, GGC, AGG, GTG, GTT, GCC, ATC, TCA, ACC, AAT, TAC, TCC, CCA, TCT, GCC, GTA, GAG, CAA, CAT, TAT, CAA, TAC, ACA, TCG, AAC, TAT, GAA, GAG, CGT, ATG, TCT, CCA, GGG, ACG, CTG, GCA, CAT, CAT, GTC, CAG, CGC, AAA, GAG, TTA, CTT, ACT, ATG, CGG, CGG, GAT, ACC, TTG, TTT, GAT, ATT, GAT, TAC, GGC, CCG, GCA, GTT, TTA, CAT, CAA, AAC, GAT, CCG, GGA, ATG, TTG, GTA, AAA, CCG, GTT, CTT, CCG, GCA, TAT, CGT, CAT, TTT, GAA, CTG, GTC, AGA, ATA, CTG, ACC, GAT, GAG, CAT, TCC, AAC, AAC, GTT, CAG, CAT, TAC, CTT, GAT, CAC, GAA, TGC, TTT, ATA, TTG, GGC, GGC, TGC, CTG, ATG, GCT, AAT, TTG, CAG, CAT, ATT, CAT, CAA, GGT, CGC, TGC, CAT, ATT, TCC, TTT, GTC, AAA, GAG, CGC, GGT, GTG, GCA, CCC, GCC, ACC, ATT, GAT, TTT, CCA, CCG, CGA, TTA, TTC, CTT, AGT, GGT, GGG, GTA, CGA, AAT, AAT, GTC, TGG, CGT, GCA, TTT, TCT, AAC, CGC, AAT, TAT, TCA, ATG, GCT, GTA, TGC, AAT, CTC, ACT, GGC, AGT, AAG, AAA, GTC, CGC, GAG, ATG, CGG, CAT, GCA, ACA, TTG, AAC, AGT, GCG, ACG, CGT, TTT, ATC, CAC, TTT, GTG, GAG, AAC, CAT, CCT, TTC, CTT, ATA, TCA, TTG, AAC, CGA, ATG, TCT, CCT, GCG, 
AAT, GTC, GTT, TCT, ACA, TTA, GAT, ATC, CTC, AAA, CAT, CTG, TGG, AAT, AAA, AAA, CTA, GAG, CAT, GGA, ACA, ATT, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: sodium/proton antiporter 1
|
||||||
|
Nucleotides: GTGAAACATCTGCATCGATTCTTTAGCAGTGATGCCTCGGGAGGCATTATTCTCATTATTGCCGCTGTATTAGCGATGATTATGGCCAACAGCGGTGCAACCAGTGGATGGTATCACGACTTTCTTGAGACGCCGGTTCAGCTCCGGGTTGGGACACTTGAGATCAACAAGAACATGCTGCTATGGATCAATGACGCTCTGATGGCGGTATTTTTCCTGTTGGTTGGTCTGGAAGTTAAACGCGAGCTGATGCAAGGTTCGCTGGCCAGTCTGCGCCAGGCGGCATTTCCTGTTATTGCCGCAATCGGCGGGATGATTGTCCCGGCATTGCTCTATCTGGCTTTTAACTATGCCGATCCGATTACCCGCGAAGGCTGGGCAATCCCGGCGGCGACTGACATTGCCTTTGCACTTGGTGTGTTGGCGCTGTTGGGAAGTCGTGTTCCGTTAGCGCTGAAGATCTTTTTGATGGCTCTGGCTATTATCGACGATCTTGGGGCCATCATTATCATCGCATTGTTCTACACTAATGACTTATCGATGGCCTCTCTTGGCGTCGCGGCTGTAGCAATTGCGGTACTCGCGGTATTGAATCTGTGTGGTGTACGCCGCACGGGCGTTTATATTCTGGTTGGCGTGGTGCTGTGGACAGCGGTGTTGAAATCGGGGGTTCACGCAACCCTGGCTGGCGTCATTGTCGGCTTCTTTATTCCTTTGAAAGAGAAGCATGGGCGCTCTCCGGCTAAACGTCTGGAGCATGTTTTGCATCCATGGGTGGCGTATCTGATTTTGCCGCTGTTTGCATTTGCTAATGCTGGCGTTTCACTGCAAGGTGTCACGCTGGAAGGTTTGACCTCCATTCTGCCATTAGGGATCATCGCTGGTTTGCTGATTGGCAAGCCACTGGGTATTAGTCTGTTCTGCTGGTTGGCGCTGCGTTTGAAATTGGCACATCTGCCAGAGGGAACGACTTACCAGCAAATTATGGCGGTTGGTATCCTGTGCGGTATCGGTTTTACTATGTCTATCTTTATTGCCAGCCTGGCATTTGGTAGCGTAGATCCAGAACTGATTAACTGGGCAAAATTAGGTATCCTTGTCGGTTCAATTTCTTCGGCGGTAATTGGATATAGCTGGTTACGCGTTCGTTTACGTCCATCAGTTTGA
|
||||||
|
Nuc. Counts: [215, 258, 331, 363]
|
||||||
|
Total Mass%: [19.0, 18.7, 32.7, 29.7] of 153154.3
|
||||||
|
Codons List: [GTG, AAA, CAT, CTG, CAT, CGA, TTC, TTT, AGC, AGT, GAT, GCC, TCG, GGA, GGC, ATT, ATT, CTC, ATT, ATT, GCC, GCT, GTA, TTA, GCG, ATG, ATT, ATG, GCC, AAC, AGC, GGT, GCA, ACC, AGT, GGA, TGG, TAT, CAC, GAC, TTT, CTT, GAG, ACG, CCG, GTT, CAG, CTC, CGG, GTT, GGG, ACA, CTT, GAG, ATC, AAC, AAG, AAC, ATG, CTG, CTA, TGG, ATC, AAT, GAC, GCT, CTG, ATG, GCG, GTA, TTT, TTC, CTG, TTG, GTT, GGT, CTG, GAA, GTT, AAA, CGC, GAG, CTG, ATG, CAA, GGT, TCG, CTG, GCC, AGT, CTG, CGC, CAG, GCG, GCA, TTT, CCT, GTT, ATT, GCC, GCA, ATC, GGC, GGG, ATG, ATT, GTC, CCG, GCA, TTG, CTC, TAT, CTG, GCT, TTT, AAC, TAT, GCC, GAT, CCG, ATT, ACC, CGC, GAA, GGC, TGG, GCA, ATC, CCG, GCG, GCG, ACT, GAC, ATT, GCC, TTT, GCA, CTT, GGT, GTG, TTG, GCG, CTG, TTG, GGA, AGT, CGT, GTT, CCG, TTA, GCG, CTG, AAG, ATC, TTT, TTG, ATG, GCT, CTG, GCT, ATT, ATC, GAC, GAT, CTT, GGG, GCC, ATC, ATT, ATC, ATC, GCA, TTG, TTC, TAC, ACT, AAT, GAC, TTA, TCG, ATG, GCC, TCT, CTT, GGC, GTC, GCG, GCT, GTA, GCA, ATT, GCG, GTA, CTC, GCG, GTA, TTG, AAT, CTG, TGT, GGT, GTA, CGC, CGC, ACG, GGC, GTT, TAT, ATT, CTG, GTT, GGC, GTG, GTG, CTG, TGG, ACA, GCG, GTG, TTG, AAA, TCG, GGG, GTT, CAC, GCA, ACC, CTG, GCT, GGC, GTC, ATT, GTC, GGC, TTC, TTT, ATT, CCT, TTG, AAA, GAG, AAG, CAT, GGG, CGC, TCT, CCG, GCT, AAA, CGT, CTG, GAG, CAT, GTT, TTG, CAT, CCA, TGG, GTG, GCG, TAT, CTG, ATT, TTG, CCG, CTG, TTT, GCA, TTT, GCT, AAT, GCT, GGC, GTT, TCA, CTG, CAA, GGT, GTC, ACG, CTG, GAA, GGT, TTG, ACC, TCC, ATT, CTG, CCA, TTA, GGG, ATC, ATC, GCT, GGT, TTG, CTG, ATT, GGC, AAG, CCA, CTG, GGT, ATT, AGT, CTG, TTC, TGC, TGG, TTG, GCG, CTG, CGT, TTG, AAA, TTG, GCA, CAT, CTG, CCA, GAG, GGA, ACG, ACT, TAC, CAG, CAA, ATT, ATG, GCG, GTT, GGT, ATC, CTG, TGC, GGT, ATC, GGT, TTT, ACT, ATG, TCT, ATC, TTT, ATT, GCC, AGC, CTG, GCA, TTT, GGT, AGC, GTA, GAT, CCA, GAA, CTG, ATT, AAC, TGG, GCA, AAA, TTA, GGT, ATC, CTT, GTC, GGT, TCA, ATT, TCT, TCG, GCG, GTA, ATT, GGA, TAT, AGC, TGG, TTA, CGC, GTT, CGT, TTA, CGT, CCA, TCA, GTT, TGA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: transcriptional activator protein NhaR
|
||||||
|
Nucleotides: ATGAGCATGTCTCATATCAATTACAACCACTTGTATTACTTCTGGCATGTCTACAAAGAAGGTTCTGTGGTTGGCGCAGCGGAGGCGCTTTATTTAACACCACAAACCATTACCGGGCAGATCCGGGCGCTGGAAGAGCGCCTGCAAGGGAAACTATTTAAGCGTAAAGGACGTGGTCTGGAACCCAGCGAACTGGGGGAACTGGTCTATCGCTATGCCGATAAAATGTTCACCTTAAGCCAGGAAATGCTGGATATCGTCAACTATCGCAAAGAGTCCAACTTATTGTTTGATGTTGGTGTGGCAGATGCACTTTCCAAACGTCTGGTCAGCAGTGTTCTGGATGCCGCAGTTGTGGAAGACGAGCAGATCCATCTACGCTGTTTCGAATCGACGCACGAGATGCTTTTAGAGCAGTTGAGTCAGCATAAACTGGATATGATCATCTCTGACTGTCCGATCGATTCCACTCAGCAGGAAGGGCTGTTTTCCATGAAAATTGGCGAATGTGGTGTCAGTTTCTGGTGCACTAACCCACTACCAGAAAAGCCGTTTCCTGCCTGTCTTGAAGAGCGTCGTTTACTTATTCCGGGGCGTCGCTCAATGTTGGGGCGTAAACTATTAAACTGGTTTAACTCCCAGGGCTTGAACGTCGAAATTTTGGGTGAGTTTGATGATGCTGCGTTGATGAAAGCCTTTGGGGCGACGCATAACGCTATTTTCGTTGCACCTTCGCTTTACGCTAATGATTTCTATAACGATGACTCGGTTGTGGAGATAGGCCGTGTTGAGAACGTGATGGAAGAGTACCACGCGATTTTTGCCGAAAGGATGATTCAGCACCCTGCAGTACAGCGTATCTGCAATACAGACTATTCTGCGCTGTTTACTCCAGCTTCAAAATAA
|
||||||
|
Nuc. Counts: [228, 197, 232, 249]
|
||||||
|
Total Mass%: [25.9, 18.4, 29.5, 26.2] of 118909.8
|
||||||
|
Codons List: [ATG, AGC, ATG, TCT, CAT, ATC, AAT, TAC, AAC, CAC, TTG, TAT, TAC, TTC, TGG, CAT, GTC, TAC, AAA, GAA, GGT, TCT, GTG, GTT, GGC, GCA, GCG, GAG, GCG, CTT, TAT, TTA, ACA, CCA, CAA, ACC, ATT, ACC, GGG, CAG, ATC, CGG, GCG, CTG, GAA, GAG, CGC, CTG, CAA, GGG, AAA, CTA, TTT, AAG, CGT, AAA, GGA, CGT, GGT, CTG, GAA, CCC, AGC, GAA, CTG, GGG, GAA, CTG, GTC, TAT, CGC, TAT, GCC, GAT, AAA, ATG, TTC, ACC, TTA, AGC, CAG, GAA, ATG, CTG, GAT, ATC, GTC, AAC, TAT, CGC, AAA, GAG, TCC, AAC, TTA, TTG, TTT, GAT, GTT, GGT, GTG, GCA, GAT, GCA, CTT, TCC, AAA, CGT, CTG, GTC, AGC, AGT, GTT, CTG, GAT, GCC, GCA, GTT, GTG, GAA, GAC, GAG, CAG, ATC, CAT, CTA, CGC, TGT, TTC, GAA, TCG, ACG, CAC, GAG, ATG, CTT, TTA, GAG, CAG, TTG, AGT, CAG, CAT, AAA, CTG, GAT, ATG, ATC, ATC, TCT, GAC, TGT, CCG, ATC, GAT, TCC, ACT, CAG, CAG, GAA, GGG, CTG, TTT, TCC, ATG, AAA, ATT, GGC, GAA, TGT, GGT, GTC, AGT, TTC, TGG, TGC, ACT, AAC, CCA, CTA, CCA, GAA, AAG, CCG, TTT, CCT, GCC, TGT, CTT, GAA, GAG, CGT, CGT, TTA, CTT, ATT, CCG, GGG, CGT, CGC, TCA, ATG, TTG, GGG, CGT, AAA, CTA, TTA, AAC, TGG, TTT, AAC, TCC, CAG, GGC, TTG, AAC, GTC, GAA, ATT, TTG, GGT, GAG, TTT, GAT, GAT, GCT, GCG, TTG, ATG, AAA, GCC, TTT, GGG, GCG, ACG, CAT, AAC, GCT, ATT, TTC, GTT, GCA, CCT, TCG, CTT, TAC, GCT, AAT, GAT, TTC, TAT, AAC, GAT, GAC, TCG, GTT, GTG, GAG, ATA, GGC, CGT, GTT, GAG, AAC, GTG, ATG, GAA, GAG, TAC, CAC, GCG, ATT, TTT, GCC, GAA, AGG, ATG, ATT, CAG, CAC, CCT, GCA, GTA, CAG, CGT, ATC, TGC, AAT, ACA, GAC, TAT, TCT, GCG, CTG, TTT, ACT, CCA, GCT, TCA, AAA, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: riboflavin kinase
|
||||||
|
Nucleotides: ATGAAGCTGATACGCGGCATACATAATCTCAGCCAGGCCCCGCAAGAAGGGTGTGTGCTGACTATTGGTAATTTCGACGGCGTGCATCGCGGTCATCGCGCGCTGTTACAGGGCTTGCAGGAAGAAGGGCGCAAGCGCAACTTACCGGTGATGGTGATGCTTTTTGAACCTCAACCACTGGAACTGTTTGCTACTGATAAAGCCCCGGCACGGCTCACCCGGCTGCGGGAAAAACTGCGTTATCTTGCAGAGTGTGGCGTTGATTACGTGCTGTGCGTGCGTTTTGACAGGCGTTTTGCGGCGTTAACCGCGCAAAACTTCATCAGTGATCTTCTGGTGAAGCACTTGCGGGTAAAATTTCTTGCCGTAGGTGACGATTTCCGCTTTGGCGCTGGTCGTGAAGGCGATTTCTTGTTATTACAGAAAGCGGGCATGGAATACGGCTTCGATATCACCAGCACGCAAACTTTTTGCGAAGGTGGTGTGCGTATCAGCAGCACCGCCGTGCGTCAGGCGCTTGCGGATGACAATCTGGCTCTGGCAGAAAGTTTACTGGGGCACCCGTTTGCTATCTCCGGGCGTGTAGTCCACGGTGATGAATTAGGGCGCACTATAGGTTTCCCGACGGCGAATGTACCGCTACGCCGTCAGGTTTCCCCGGTGAAAGGGGTTTATGCGGTAGAAGTGTTGGGCCTTGGCGAAAAGCCGTTACCCGGCGTTGCAAACATCGGAACACGCCCAACGGTTGCCGGTATTCGCCAGCAACTGGAAGTGCATTTGTTAGATGTTGCAATGGACCTTTATGGTCGCCATATACAAGTAGTGCTGCGTAAAAAAATACGCAATGAGCAGCGATTTGCATCGCTGGACGAACTGAAAGCGCAGATTGCGCGTGATGAATTAACCGCCCGCGAATTTTTTGGGCTAACAAAACCGGCTTAA
|
||||||
|
Nuc. Counts: [213, 221, 276, 232]
|
||||||
|
Total Mass%: [23.2, 19.8, 33.6, 23.4] of 124072.2
|
||||||
|
Codons List: [ATG, AAG, CTG, ATA, CGC, GGC, ATA, CAT, AAT, CTC, AGC, CAG, GCC, CCG, CAA, GAA, GGG, TGT, GTG, CTG, ACT, ATT, GGT, AAT, TTC, GAC, GGC, GTG, CAT, CGC, GGT, CAT, CGC, GCG, CTG, TTA, CAG, GGC, TTG, CAG, GAA, GAA, GGG, CGC, AAG, CGC, AAC, TTA, CCG, GTG, ATG, GTG, ATG, CTT, TTT, GAA, CCT, CAA, CCA, CTG, GAA, CTG, TTT, GCT, ACT, GAT, AAA, GCC, CCG, GCA, CGG, CTC, ACC, CGG, CTG, CGG, GAA, AAA, CTG, CGT, TAT, CTT, GCA, GAG, TGT, GGC, GTT, GAT, TAC, GTG, CTG, TGC, GTG, CGT, TTT, GAC, AGG, CGT, TTT, GCG, GCG, TTA, ACC, GCG, CAA, AAC, TTC, ATC, AGT, GAT, CTT, CTG, GTG, AAG, CAC, TTG, CGG, GTA, AAA, TTT, CTT, GCC, GTA, GGT, GAC, GAT, TTC, CGC, TTT, GGC, GCT, GGT, CGT, GAA, GGC, GAT, TTC, TTG, TTA, TTA, CAG, AAA, GCG, GGC, ATG, GAA, TAC, GGC, TTC, GAT, ATC, ACC, AGC, ACG, CAA, ACT, TTT, TGC, GAA, GGT, GGT, GTG, CGT, ATC, AGC, AGC, ACC, GCC, GTG, CGT, CAG, GCG, CTT, GCG, GAT, GAC, AAT, CTG, GCT, CTG, GCA, GAA, AGT, TTA, CTG, GGG, CAC, CCG, TTT, GCT, ATC, TCC, GGG, CGT, GTA, GTC, CAC, GGT, GAT, GAA, TTA, GGG, CGC, ACT, ATA, GGT, TTC, CCG, ACG, GCG, AAT, GTA, CCG, CTA, CGC, CGT, CAG, GTT, TCC, CCG, GTG, AAA, GGG, GTT, TAT, GCG, GTA, GAA, GTG, TTG, GGC, CTT, GGC, GAA, AAG, CCG, TTA, CCC, GGC, GTT, GCA, AAC, ATC, GGA, ACA, CGC, CCA, ACG, GTT, GCC, GGT, ATT, CGC, CAG, CAA, CTG, GAA, GTG, CAT, TTG, TTA, GAT, GTT, GCA, ATG, GAC, CTT, TAT, GGT, CGC, CAT, ATA, CAA, GTA, GTG, CTG, CGT, AAA, AAA, ATA, CGC, AAT, GAG, CAG, CGA, TTT, GCA, TCG, CTG, GAC, GAA, CTG, AAA, GCG, CAG, ATT, GCG, CGT, GAT, GAA, TTA, ACC, GCC, CGC, GAA, TTT, TTT, GGG, CTA, ACA, AAA, CCG, GCT, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: Isoleucyl-tRNA synthetase
|
||||||
|
Nucleotides: ATGAGTGACTATAAATCAACCCTGAATTTGCCGGAAACAGGGTTCCCGATGCGTGGCGATCTCGCCAAGCGCGAACCGGGAATGCTGGCGCGTTGGACTGATGATGATCTGTACGGCATCATCCGTGCGGCTAAAAAAGGCAAAAAAACCTTCATTCTGCATGATGGCCCTCCTTATGCGAATGGCAGCATTCATATTGGTCACTCGGTTAACAAGATTCTGAAAGACATTATCATTAAGTCCAAAGGGCTTTCTGGATATGACTCGCCGTATGTGCCTGGCTGGGACTGTCATGGTCTGCCAATCGAACTGAAAGTAGAGCAAGAATACGGTAAGCCGGGGGAGAAATTCACCGCCGCTGAGTTCCGCGCCAAGTGCCGCGAATACGCTGCGACCCAGGTTGACGGTCAGCGCAAAGACTTTATCCGTCTGGGCGTGCTGGGCGACTGGTCGCACCCGTACCTGACCATGGACTTCAAAACTGAAGCCAACATCATCCGCGCGCTGGGCAAAATCATCGGCAACGGTCACCTGCACAAAGGCGCGAAGCCGGTGCACTGGTGCGTTGACTGCCGTTCTGCACTGGCAGAAGCGGAAGTTGAGTATTACGACAAAACTTCTCCGTCCATCGACGTCGCTTTCCAGGCGGTCGATCAGGATGCGCTGAAAACGAAATTTGGCGTAAGCAATGTTAACGGCCCAATTTCGCTGGTTATCTGGACCACCACGCCGTGGACGCTGCCTGCTAACCGCGCAATCTCCATTGCACCTGATTTTGATTATGCGCTGGTGCAAATCGACGGTCAGGCCGTGATCCTCGCGAAAGATCTGGTTGAAAGCGTAATGCAGCGTATCGGCGTTAGCGATTACACCATTCTTGGCACGGTGAAAGGTGCCGAGCTGGAACTGTTGCGCTTTACCCATCCGTTTATGGACTTCGATGTTCCGGCAATTCTCGGCGACCACGTTACGCTGGATGCCGGTACCGGTGCCGTTCATACCGCGCCAGGCCACGGTCCGGACGACTATGTGATCGGTCAAAAATATGGTCTGGAAACCGCTAACCCGGTTGGCCCGGACGGCACTTATCTGCCGGGTACTTACCCGACTCTGGATGGCGTTAACGTCTTCAAAGCGAACGATATTGTCATTGCGTTGTTGCAGGAAAAAGGCGCACTGTTGCACGTTGAGAAAATGCAACACAGCTATCCGTGCTGCTGGCGTCATAAAACGCCGATCATCTTCCGCGCGACGCCGCAGTGGTTCGTCAGCATGGATCAGAAAGGTCTGCGTGCGCAGTCACTGAAAGAGATCAAAGGCGTGCAGTGGATCCCTGACTGGGGCCAGGCGCGTATCGAGTCGATGGTTGCTAACCGTCCTGACTGGTGTATCTCTCGTCAGCGTACCTGGGGCGTGCCGATGTCACTGTTCGTGCACAAAGACACAGAAGAACTGCATCCGCGTACTCTCGAACTGATGGAAGAAGTGGCAAAACGCGTTGAAGTTGACGGCATTCAGGCGTGGTGGGATCTCGATGCGAAAGAGATCCTCGGCGACGAAGCTGACCAGTATGTGAAAGTACCGGATACGCTGGATGTATGGTTTGACTCCGGATCTACCCACTCTTCCGTTGTTGATGTGCGTCCGGAATTTGCCGGTCACGCAGCGGACATGTATCTGGAAGGTTCTGACCAACACCGTGGCTGGTTCATGTCTTCCCTGATGATCTCTACCGCGATGAAGGGCAAAGCGCCATATCGTCAGGTACTGACTCACGGCTTTACCGTGGATGGTCAGGGTCGCAAGATGTCTAAATCCATCGGTAACACCGTTTCGCCGCAGGATGTGATGAATAAACTGGGTGCGGATATTCTGCGTCTGTGGGTGGCATCAACCGACTACACTGGCGAAATGGCCGTTTCTGACGAGATCCTGAAACGTGCTGCCGACAGCTATCGTCGTATCCGTAACACCGCGCGCTTCCTGC
TGGCAAACCTGAACGGTTTTGATCCGGCAAAAGATATGGTGAAACCGGAAGAGATGGTGGTACTGGATCGCTGGGCCGTAGGTTGTGCGAAAGCGGCACAGGAAGACATCCTCAAGGCGTACGAAGCATACGATTTCCACGAAGTGGTACAGCGTCTGATGCGCTTCTGCTCCGTTGAGATGGGTTCCTTCTACCTCGACATCATCAAAGACCGTCAGTATACCGCCAAAGCGGACAGCGTGGCGCGTCGTAGCTGCCAGACTGCGCTGTATCACATCGCAGAAGCGCTGGTTCGCTGGATGGCACCAATCCTCTCCTTCACCGCTGATGAAGTGTGGGGTTACCTGCCGGGCGAACGTGAAAAATACGTCTTCACCGGCGAGTGGTACGAAGGCCTGTTTGGTCTGGCAGACAGTGAAGCAATGAACGATGCGTTCTGGGACGAGCTGTTGAAAGTGCGTGGCGAAGTGAACAAAGTCATTGAGCAAGCGCGTGCCGATAAGAACGTGGGCGGCTCGCTGGAAGCGGCAGTAACCTTGTATGCAGAACCGGAACTGGCGGCGAAACTGACCGCGCTGGGCGATGAATTACGATTTGTCCTGTTGACCTCCGGCGCTACCGTTGCAGACTATAACGACGCACCTGCTGATGCCCAGCAGAGCGAAGTCCTCAAAGGGCTGAAAGTCGCGTTGAGTAAAGCCGAAGGTGAGAAGTGTCCTCGCTGCTGGCACTACACCCAGGATGTCGGCAAGGTGGCGGAACACGCAGAAATCTGCGGCCGCTGTGTCAGCAACGTCGCCGGTGACGGTGAAAAACGTAAGTTTGCCTGA
|
||||||
|
Nuc. Counts: [660, 720, 817, 620]
|
||||||
|
Total Mass%: [24.1, 21.6, 33.4, 21.0] of 370216.6
|
||||||
|
Codons List: [ATG, AGT, GAC, TAT, AAA, TCA, ACC, CTG, AAT, TTG, CCG, GAA, ACA, GGG, TTC, CCG, ATG, CGT, GGC, GAT, CTC, GCC, AAG, CGC, GAA, CCG, GGA, ATG, CTG, GCG, CGT, TGG, ACT, GAT, GAT, GAT, CTG, TAC, GGC, ATC, ATC, CGT, GCG, GCT, AAA, AAA, GGC, AAA, AAA, ACC, TTC, ATT, CTG, CAT, GAT, GGC, CCT, CCT, TAT, GCG, AAT, GGC, AGC, ATT, CAT, ATT, GGT, CAC, TCG, GTT, AAC, AAG, ATT, CTG, AAA, GAC, ATT, ATC, ATT, AAG, TCC, AAA, GGG, CTT, TCT, GGA, TAT, GAC, TCG, CCG, TAT, GTG, CCT, GGC, TGG, GAC, TGT, CAT, GGT, CTG, CCA, ATC, GAA, CTG, AAA, GTA, GAG, CAA, GAA, TAC, GGT, AAG, CCG, GGG, GAG, AAA, TTC, ACC, GCC, GCT, GAG, TTC, CGC, GCC, AAG, TGC, CGC, GAA, TAC, GCT, GCG, ACC, CAG, GTT, GAC, GGT, CAG, CGC, AAA, GAC, TTT, ATC, CGT, CTG, GGC, GTG, CTG, GGC, GAC, TGG, TCG, CAC, CCG, TAC, CTG, ACC, ATG, GAC, TTC, AAA, ACT, GAA, GCC, AAC, ATC, ATC, CGC, GCG, CTG, GGC, AAA, ATC, ATC, GGC, AAC, GGT, CAC, CTG, CAC, AAA, GGC, GCG, AAG, CCG, GTG, CAC, TGG, TGC, GTT, GAC, TGC, CGT, TCT, GCA, CTG, GCA, GAA, GCG, GAA, GTT, GAG, TAT, TAC, GAC, AAA, ACT, TCT, CCG, TCC, ATC, GAC, GTC, GCT, TTC, CAG, GCG, GTC, GAT, CAG, GAT, GCG, CTG, AAA, ACG, AAA, TTT, GGC, GTA, AGC, AAT, GTT, AAC, GGC, CCA, ATT, TCG, CTG, GTT, ATC, TGG, ACC, ACC, ACG, CCG, TGG, ACG, CTG, CCT, GCT, AAC, CGC, GCA, ATC, TCC, ATT, GCA, CCT, GAT, TTT, GAT, TAT, GCG, CTG, GTG, CAA, ATC, GAC, GGT, CAG, GCC, GTG, ATC, CTC, GCG, AAA, GAT, CTG, GTT, GAA, AGC, GTA, ATG, CAG, CGT, ATC, GGC, GTT, AGC, GAT, TAC, ACC, ATT, CTT, GGC, ACG, GTG, AAA, GGT, GCC, GAG, CTG, GAA, CTG, TTG, CGC, TTT, ACC, CAT, CCG, TTT, ATG, GAC, TTC, GAT, GTT, CCG, GCA, ATT, CTC, GGC, GAC, CAC, GTT, ACG, CTG, GAT, GCC, GGT, ACC, GGT, GCC, GTT, CAT, ACC, GCG, CCA, GGC, CAC, GGT, CCG, GAC, GAC, TAT, GTG, ATC, GGT, CAA, AAA, TAT, GGT, CTG, GAA, ACC, GCT, AAC, CCG, GTT, GGC, CCG, GAC, GGC, ACT, TAT, CTG, CCG, GGT, ACT, TAC, CCG, ACT, CTG, GAT, GGC, GTT, AAC, GTC, TTC, AAA, GCG, AAC, GAT, ATT, GTC, ATT, GCG, TTG, TTG, CAG, GAA, AAA, GGC, GCA, CTG, TTG, CAC, GTT, GAG, 
AAA, ATG, CAA, CAC, AGC, TAT, CCG, TGC, TGC, TGG, CGT, CAT, AAA, ACG, CCG, ATC, ATC, TTC, CGC, GCG, ACG, CCG, CAG, TGG, TTC, GTC, AGC, ATG, GAT, CAG, AAA, GGT, CTG, CGT, GCG, CAG, TCA, CTG, AAA, GAG, ATC, AAA, GGC, GTG, CAG, TGG, ATC, CCT, GAC, TGG, GGC, CAG, GCG, CGT, ATC, GAG, TCG, ATG, GTT, GCT, AAC, CGT, CCT, GAC, TGG, TGT, ATC, TCT, CGT, CAG, CGT, ACC, TGG, GGC, GTG, CCG, ATG, TCA, CTG, TTC, GTG, CAC, AAA, GAC, ACA, GAA, GAA, CTG, CAT, CCG, CGT, ACT, CTC, GAA, CTG, ATG, GAA, GAA, GTG, GCA, AAA, CGC, GTT, GAA, GTT, GAC, GGC, ATT, CAG, GCG, TGG, TGG, GAT, CTC, GAT, GCG, AAA, GAG, ATC, CTC, GGC, GAC, GAA, GCT, GAC, CAG, TAT, GTG, AAA, GTA, CCG, GAT, ACG, CTG, GAT, GTA, TGG, TTT, GAC, TCC, GGA, TCT, ACC, CAC, TCT, TCC, GTT, GTT, GAT, GTG, CGT, CCG, GAA, TTT, GCC, GGT, CAC, GCA, GCG, GAC, ATG, TAT, CTG, GAA, GGT, TCT, GAC, CAA, CAC, CGT, GGC, TGG, TTC, ATG, TCT, TCC, CTG, ATG, ATC, TCT, ACC, GCG, ATG, AAG, GGC, AAA, GCG, CCA, TAT, CGT, CAG, GTA, CTG, ACT, CAC, GGC, TTT, ACC, GTG, GAT, GGT, CAG, GGT, CGC, AAG, ATG, TCT, AAA, TCC, ATC, GGT, AAC, ACC, GTT, TCG, CCG, CAG, GAT, GTG, ATG, AAT, AAA, CTG, GGT, GCG, GAT, ATT, CTG, CGT, CTG, TGG, GTG, GCA, TCA, ACC, GAC, TAC, ACT, GGC, GAA, ATG, GCC, GTT, TCT, GAC, GAG, ATC, CTG, AAA, CGT, GCT, GCC, GAC, AGC, TAT, CGT, CGT, ATC, CGT, AAC, ACC, GCG, CGC, TTC, CTG, CTG, GCA, AAC, CTG, AAC, GGT, TTT, GAT, CCG, GCA, AAA, GAT, ATG, GTG, AAA, CCG, GAA, GAG, ATG, GTG, GTA, CTG, GAT, CGC, TGG, GCC, GTA, GGT, TGT, GCG, AAA, GCG, GCA, CAG, GAA, GAC, ATC, CTC, AAG, GCG, TAC, GAA, GCA, TAC, GAT, TTC, CAC, GAA, GTG, GTA, CAG, CGT, CTG, ATG, CGC, TTC, TGC, TCC, GTT, GAG, ATG, GGT, TCC, TTC, TAC, CTC, GAC, ATC, ATC, AAA, GAC, CGT, CAG, TAT, ACC, GCC, AAA, GCG, GAC, AGC, GTG, GCG, CGT, CGT, AGC, TGC, CAG, ACT, GCG, CTG, TAT, CAC, ATC, GCA, GAA, GCG, CTG, GTT, CGC, TGG, ATG, GCA, CCA, ATC, CTC, TCC, TTC, ACC, GCT, GAT, GAA, GTG, TGG, GGT, TAC, CTG, CCG, GGC, GAA, CGT, GAA, AAA, TAC, GTC, TTC, ACC, GGC, GAG, TGG, TAC, GAA, GGC, CTG, TTT, GGT, 
CTG, GCA, GAC, AGT, GAA, GCA, ATG, AAC, GAT, GCG, TTC, TGG, GAC, GAG, CTG, TTG, AAA, GTG, CGT, GGC, GAA, GTG, AAC, AAA, GTC, ATT, GAG, CAA, GCG, CGT, GCC, GAT, AAG, AAC, GTG, GGC, GGC, TCG, CTG, GAA, GCG, GCA, GTA, ACC, TTG, TAT, GCA, GAA, CCG, GAA, CTG, GCG, GCG, AAA, CTG, ACC, GCG, CTG, GGC, GAT, GAA, TTA, CGA, TTT, GTC, CTG, TTG, ACC, TCC, GGC, GCT, ACC, GTT, GCA, GAC, TAT, AAC, GAC, GCA, CCT, GCT, GAT, GCC, CAG, CAG, AGC, GAA, GTC, CTC, AAA, GGG, CTG, AAA, GTC, GCG, TTG, AGT, AAA, GCC, GAA, GGT, GAG, AAG, TGT, CCT, CGC, TGC, TGG, CAC, TAC, ACC, CAG, GAT, GTC, GGC, AAG, GTG, GCG, GAA, CAC, GCA, GAA, ATC, TGC, GGC, CGC, TGT, GTC, AGC, AAC, GTC, GCC, GGT, GAC, GGT, GAA, AAA, CGT, AAG, TTT, GCC, TGA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
||||||
|
Region Name: Non-protein region
|
||||||
|
Nucleotides: GCTTGCGCCAACGCCATTTCATCGCCATCCCGCCGAGCATACAGGCCTCGGAAGAACCAATGGTGTTGGTGCCAACGGCCTGACCATTTTTCGGTGCAGGCGCATGCCACAGATCGGCAACCATGTTTACGCAACGCAGATCGATTGCTGCAGATTGCGGATATTCTTCTTTGTCGATCCAGTTTTTGTTAATGGATAAATCCA
|
||||||
|
Nuc. Counts: [46, 56, 49, 53]
|
||||||
|
Total Mass%: [23.5, 23.5, 28.0, 25.0] of 26473.6
|
||||||
|
Codons List: [GCT, TGC, GCC, AAC, GCC, ATT, TCA, TCG, CCA, TCC, CGC, CGA, GCA, TAC, AGG, CCT, CGG, AAG, AAC, CAA, TGG, TGT, TGG, TGC, CAA, CGG, CCT, GAC, CAT, TTT, TCG, GTG, CAG, GCG, CAT, GCC, ACA, GAT, CGG, CAA, CCA, TGT, TTA, CGC, AAC, GCA, GAT, CGA, TTG, CTG, CAG, ATT, GCG, GAT, ATT, CTT, CTT, TGT, CGA, TCC, AGT, TTT, TGT, TAA, TGG, ATA, AAT, CCA]
|
||||||
|
Is Protein?: NO
|
||||||
|
|
||||||
|
Region Name: FKBP-type 16 kDa peptidyl-prolyl cis-trans isomerase
|
||||||
|
Nucleotides: ATGTCTGAATCTGTACAGAGCAATAGCGCCGTCCTGGTGCACTTCACGCTAAAACTCGACGATGGCACCACCGCTGAGTCTACCCGCAACAACGGTAAACCGGCGCTGTTCCGCCTGGGTGATGCTTCTCTTTCTGAAGGGCTGGAGCAACACCTGCTGGGGCTGAAAGTGGGCGATAAAACCACCTTCTCGCTGGAGCCAGATGCGGCGTTTGGCGTGCCGTCACCGGACCTGATTCAGTACTTCTCCCGCCGTGAATTTATGGATGCAGGCGAGCCAGAAATTGGCGCAATCATGCTTTTTACCGCAATGGATGGCAGTGAGATGCCTGGCGTGATCCGCGAAATTAACGGCGACTCCATTACCGTTGATTTCAACCATCCGCTGGCCGGGCAGACCGTTCATTTTGATATTGAAGTGCTGGAAATCGATCCGGCACTGGAGGCGTAA
|
||||||
|
Nuc. Counts: [100, 121, 125, 104]
|
||||||
|
Total Mass%: [23.0, 22.8, 32.1, 22.1] of 58858.4
|
||||||
|
Codons List: [ATG, TCT, GAA, TCT, GTA, CAG, AGC, AAT, AGC, GCC, GTC, CTG, GTG, CAC, TTC, ACG, CTA, AAA, CTC, GAC, GAT, GGC, ACC, ACC, GCT, GAG, TCT, ACC, CGC, AAC, AAC, GGT, AAA, CCG, GCG, CTG, TTC, CGC, CTG, GGT, GAT, GCT, TCT, CTT, TCT, GAA, GGG, CTG, GAG, CAA, CAC, CTG, CTG, GGG, CTG, AAA, GTG, GGC, GAT, AAA, ACC, ACC, TTC, TCG, CTG, GAG, CCA, GAT, GCG, GCG, TTT, GGC, GTG, CCG, TCA, CCG, GAC, CTG, ATT, CAG, TAC, TTC, TCC, CGC, CGT, GAA, TTT, ATG, GAT, GCA, GGC, GAG, CCA, GAA, ATT, GGC, GCA, ATC, ATG, CTT, TTT, ACC, GCA, ATG, GAT, GGC, AGT, GAG, ATG, CCT, GGC, GTG, ATC, CGC, GAA, ATT, AAC, GGC, GAC, TCC, ATT, ACC, GTT, GAT, TTC, AAC, CAT, CCG, CTG, GCC, GGG, CAG, ACC, GTT, CAT, TTT, GAT, ATT, GAA, GTG, CTG, GAA, ATC, GAT, CCG, GCA, CTG, GAG, GCG, TAA]
|
||||||
|
Is Protein?: YES
|
||||||
|
|
Binary file not shown.
Loading…
Reference in New Issue