DNA Repeats start.pde

From dftwiki3
Revision as of 13:30, 24 July 2008 by Thiebaut (talk | contribs) (New page: Back to Lab 4 <hr /> <code><pre> // DNA3.pde // D. Thiebaut // Finding repeats in DNA sequence //--------------------------------------------------------------------- /...)
(diff) ← Older revision | Latest revision (diff) | Newer revision → (diff)
Jump to: navigation, search

Back to Lab 4


// DNA3.pde
// D. Thiebaut
// Finding repeats in DNA sequence

//---------------------------------------------------------------------
//  ___ _     _          _    
// / __| |___| |__  __ _| |___
//| (_ | / _ \ '_ \/ _` | (_-<
// \___|_\___/_.__/\__,_|_/__/
//
//---------------------------------------------------------------------
DNAString dna1;

String FASTA0 = "gi|194306025|dbj|AB426820.1| Escherichia coli ompT mRNA for outer membrane protease T, partial cds, strain: JCM 5491\n"
+"TGGGAATAGTCCTGACAACCCCTATTGCGATCAGCTCTTTTGCTTCTACCGAGACTTTATCGTTTACTCC"
+"TGACAACATAAATGCGGACATTAGTCTTGGAACTCTGAGCGGAAAAACAAAAGAGCGTGTTTATCTAGCC"
+"GAAGAAGGAGGCCGAAAGGTCAGTCAACTTGACTGGAAATTCAATAACGCTGCAATTATTAAAGGTGCAA"
+"TTAATTGGGATTTGATGCCCCAGATATCTATCGGGGCTGCTGGCTGGACAACTCTCGGTAGCCGAGGTGG"  
+"CAATATGGTCGATCGGGACTGGATGGATTCCAGTAACCCCGGAACCTGGACGGATGAAAGTAGACACCCT"
+"GATACACAACTCAATTATGCCAACGAATTTGATCTGAATATCAGAGGCTGGCTCCCCAACGAACCCAATT"
+"ACCGCCTGGGACTCATGGCCGGATATCAGGAAAGCCGTTATAGCTTTACAGCCAGAGGGGGTTCCTATAT"
+"CTACAGTTCTGAGGAGGGATTCAGAGATGATATCGGCTCCTTCCCGAATGGAGAAAGAGCAATCGGCTAC"
+"AAACAACGTTTTAAAATGCCCTACATTGGCTTGACTGGAAGTTATCGTTATGAAGATTTTGAGCTAGGTG"
+"GTACATTTAAATACAGCGGCTGGGTGGAAGCATTTGATAACGATGAACACTATGACCCAGGAAAAAGAAT"
+"CACTTATCGCAGTAAAGTCAAAGACCAAAATTACTATTCTGTTGCAGTCAATGCAGGTTATTACGTAACG"
+"CCTAATGCAAAAGTTTATATTGAAGGCGCATGGAATCGGGTTACGAATAAAAAAGGTGATACTTCACTTT"
+"ATGATCACAATGATAACACTTCTGACTACAGCAAAAATGGTGCAGGCATAGAAAACTATAACTTCATCAC"
+"TACTGCTGGTC";

String FASTA3 = "gi|194306025|dbj|AB426820.1| Escherichia coli ompT mRNA for outer membrane protease T, partial cds, strain: JCM 5491\n"
+"TGGGAATAGTCCTGACAACCCCTATTGCGATCAGCTCTTTTGCTTCTACCGAGACTTTATCGTTTACTCC"
+"TGACAACATAAATGCGGACATTAGTCTCTGACAACCCCTATTGGAAACAAAAGAGCGTGTTTATCTAGCC"
+"GAAGAAGGAGGCCGAAAGGTCAGTCAACTTGACTGGAAATTCAATAACGCTGCAATTATTAAAGGTGCAA"
+"TTAATTGGGATTTGATGCCCCAGATATCTATCGGGGCTGCTGGCTGGACAACTCTCGGTAGCCGAGGTGG"  
+"CAATATGGTCGATCGGGACTGGATGGATTCCAGTAACCCCGGAACCTGGACGGATGAAAGTAGACACCCT"
+"GATACACAACTCAATTATGCCAACGAATTTGATCTGAATATCAGAGGCTGGCTCCCCAACGAACCCAATT"
+"ACCGCCTGGGACTCATGGCCGGATATCAGGAAAGCCGTTATAGCTTTACAGCCAGAGGGGGTTCCTATAT"
+"CTACAGTTCTGAGGAGGGATTCAGAGATGATATCGGCTCCTTCCCGAATGGAGAAAGAGCAATCGGCTAC"
+"AAACAACGTTTTAAAATGCCCTACATTGGCTTGACTGGAAGTTATCGTTATGAAGATTTTGAGCTAGGTG"
+"GTACATTTAAATACAGCGGCTGGGTGGAAGCATTTGATAACGATGAACACTATGACCCAGGAAAAAGAAT"
+"CACTTATCGCAGTAAAGTCAAAGACCAAAATTACTATTCTGTTGCAGTCAATGCAGGTTATTACGTAACG"
+"CCTAATGCAAAAGTTTATATTGAAGGCGCATGGAATCGGGTTACGAATAAAAAAGGTGATACTTCACTTT"
+"ATGATCACAATGATAACACTTCTGACTACAGCAAAAATGGTGCAGGCATAGAAAACTATAACTTCATCAC"
+"TACTGCTGGTC";

String FASTA1 = "gi|194306025|dbj|AB426820.1| Escherichia coli ompT mRNA for outer membrane protease T, partial cds, strain: JCM 5491\n"
+"TGGGAATAGTCCTGACAACCCCTATTGCGATCAGCTCTTTTGCTTCTACCGAGACTTTATCGTTTACTCC";

String FASTA2 = "gi|194306025|dbj|AB426820.1| Escherichia coli ompT mRNA for outer membrane protease T, partial cds, strain: JCM 5491\n"
+"TGACAACATAAATGCGGACATTAGTCTTGGAACTCTGAGCGGAAAAACAAAAGAGCGTGTTTATCTAGCC";

//---------------------------------------------------------------------
// GEOMETRY
//---------------------------------------------------------------------
int WIDTH        = 800;
int MIDWIDTH     = WIDTH/2;
int HEIGHT       = 600;
int BORDER       = 10;
int TITLELINE    = 20;
int ALINE        = 30;
int SQRTOPX      = BORDER;
int SQRTOPY      = 120;
int SQRWIDTH     = min( HEIGHT-BORDER-SQRTOPY, WIDTH-BORDER*2);
int SQRHEIGHT    = SQRWIDTH;
PFont font;                          // the font used to display the symbols



//---------------------------------------------------------------------
// ___  _  _   _   ___ _       _           
//|   \| \| | /_\ / __| |_ _ _(_)_ _  __ _ 
//| |) | .` |/ _ \\__ \  _| '_| | ' \/ _` |
//|___/|_|\_/_/ \_\___/\__|_| |_|_||_\__, |
//                                   |___/ 
// DNAString Class: a class holding a DNA sequence, both as a text string
// and as an array of DNASymbol objects.
//---------------------------------------------------------------------
class DNAString {
  String symbols;     // the string of chars
  int noSymbols;      // the # of symbols
  int offsetX;        // x-value of left-most position on screen
  int offsetY;        // y-value of screen position
  int displayWidth;
  int displayHeight;

  //--- default constructor ---
  DNAString( ) {      
    symbols = "";
    noSymbols = 0;
  }

  //--- constructor ---
  DNAString( String fastaString ) {
    String[] list = split( fastaString, '\n' );
    symbols = list[1];
    noSymbols = symbols.length();
  }    

  void setBoundingBox( int x, int y, int w, int h ) {
    offsetX = x;
    offsetY = y;
    displayWidth = w;
    displayHeight = h;  
  }

  //--- returns the string of symbols ---
  String getText() {  
    return symbols;
  }

  int length() {
    return noSymbols;
  }

  void truncate( int n ) {
    if ( n < noSymbols ) {
      symbols = symbols.substring( 0, n );
      noSymbols = symbols.length();
    }  
  }

  //--- display text using default method ---
  void drawText() {   
    color myColor = color( 204, 99, 66 );
    fill( myColor );
    text( symbols, offsetX, offsetY, displayWidth, displayHeight );
  }


  //--- erase the symbols and the legs, if any ---
  void erase() {
    int tw = int( textWidth( "A" ) );
    fill( 0 );
    stroke( 0 );
    rect( BORDER*2, ALINE-12, noSymbols*tw, 12 );
  }
}


//---------------------------------------------------------------------
// ___             _   _             
//| __|  _ _ _  __| |_(_)___ _ _  ___
//| _| || | ' \/ _|  _| / _ \ ' \(_-<
//|_| \_,_|_||_\__|\__|_\___/_||_/__/
//---------------------------------------------------------------------

//---------------------------------------------------------------------
// INITFONT: initialize the fonts (must be nonproportional ---
//---------------------------------------------------------------------
void initFont( ) {  
  font = loadFont( "Monaco-12.vlw" );
  textFont( font );
}

//---------------------------------------------------------------------
// INITWINDOW: Draw the fixed text in the window
//---------------------------------------------------------------------
void initWindow( String title ) {
  color myColor = color( 99, 66, 204 );
  fill( myColor );
  text( title, BORDER, TITLELINE );
  textSize( 12 );
  //text( "A:", BORDER, ALINE );   
  stroke( myColor ); 
  line( SQRTOPX, SQRTOPY, SQRTOPX+SQRWIDTH, SQRTOPY );
  line( SQRTOPX+SQRWIDTH, SQRTOPY, SQRTOPX+SQRWIDTH, SQRTOPY+SQRHEIGHT );
  line( SQRTOPX+SQRWIDTH, SQRTOPY+SQRHEIGHT, SQRTOPX, SQRTOPY+SQRHEIGHT );
  line( SQRTOPX, SQRTOPY+SQRHEIGHT, SQRTOPX, SQRTOPY );

}

//---------------------------------------------------------------------
// SETUP: <=== STARTUP POINT.  PROCESSING STARTS HERE!!!
//---------------------------------------------------------------------
void setup() {
  size( WIDTH, HEIGHT );
  initFont();
  background( 0 );
  noStroke();   

  //--- initialize the window ---
  initWindow( "DNA Repeats" );

  //--- create the first DNA string, and position it in window ---
  dna1 = new DNAString( FASTA3 );
  dna1.truncate( SQRWIDTH-1 );
  dna1.setBoundingBox( BORDER, ALINE, WIDTH-2*BORDER, SQRTOPY-ALINE );
  dna1.drawText();
  findRepeats( 5 );    
}

//---------------------------------------------------------------------
// DRAW:  This is called many times a second.  Use it to do animation.
//---------------------------------------------------------------------
void draw() {
}

//---------------------------------------------------------------------
//---------------------------------------------------------------------
void drawPoints( int i, int j, int n ) {
  color myColor = color( 66, 204, 99 );
  fill( myColor );
  stroke( myColor );
  for ( int k=0; k<n; k++ )
    point( SQRTOPX+1+i-k, SQRTOPY+1+j-k );
}

//---------------------------------------------------------------------
// FINDREPEATS:  <== this is where the important work is 
//                               done, finding repeating patterns.
//---------------------------------------------------------------------
void findRepeats( int threshold ) {

    // add your code here...

}

//---------------------------------------------------------------------
// KEYPRESSED(): called every time a key is pressed.  
//---------------------------------------------------------------------
void  keyPressed() {
}












Back to Lab 4