Skip to content

Latest commit

 

History

History
52 lines (41 loc) · 1.98 KB

File metadata and controls

52 lines (41 loc) · 1.98 KB
title BioJava:CookBook3:MSA
permalink wiki/BioJava%3ACookBook3%3AMSA

How to create a Multiple Sequence Alignment in BioJava

package org.biojava.nbio.alignment;

import java.net.URL; import java.util.ArrayList; import java.util.List;

import org.biojava.nbio.alignment.Alignments; import
org.biojava.nbio.alignment.template.Profile; import
org.biojava.nbio.core.sequence.ProteinSequence; import
org.biojava.nbio.core.sequence.compound.AminoAcidCompound; import
org.biojava.nbio.core.sequence.io.FastaReaderHelper; import
org.biojava.nbio.core.util.ConcurrencyTools;

public class CookbookMSA {

   public static void main(String[] args) {  
       String[] ids = new String[] {"Q21691""A8WS47""O48771"};  
       try {  
           multipleSequenceAlignment(ids);  
       } catch (Exception e){  
           e.printStackTrace();  
       }  
   }

   private static void multipleSequenceAlignment(String[] idsthrows Exception {  
       List<ProteinSequencelst = new ArrayList<ProteinSequence>();  
       for (String id : ids) {  
           lst.add(getSequenceForId(id));  
       }  
       Profile<ProteinSequence, AminoAcidCompoundprofile = Alignments.getMultipleSequenceAlignment(lst);  
       System.out.printf("Clustalw:%n%s%n"profile);  
       ConcurrencyTools.shutdown();  
   }

   private static ProteinSequence getSequenceForId(String uniProtIdthrows Exception {  
       URL uniprotFasta = new URL(String.format("http://www.uniprot.org/uniprot/%s.fasta"uniProtId));  
       ProteinSequence seq = FastaReaderHelper.readFastaProteinSequence(uniprotFasta.openStream()).get(uniProtId);  
       System.out.printf("id : %s %s%n%s%n"uniProtIdseqseq.getOriginalHeader());  
       return seq;  
   }

}