Skip to content
Snippets Groups Projects
IndexFastaStream.java 6.36 KiB
Newer Older
  • Learn to ignore specific revisions
  • tjc's avatar
    tjc committed
    /* 
     * created: 2010
     *
     * This file is part of Artemis
     *
     * Copyright(C) 2010  Genome Research Limited
     *
     * This program is free software; you can redistribute it and/or
     * modify it under the terms of the GNU General Public License
     * as published by the Free Software Foundation; either version 2
     * of the License, or(at your option) any later version.
     *
     * This program is distributed in the hope that it will be useful,
     * but WITHOUT ANY WARRANTY; without even the implied warranty of
     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
     * GNU General Public License for more details.
     *
     * You should have received a copy of the GNU General Public License
     * along with this program; if not, write to the Free Software
     * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
     *
     */
    package uk.ac.sanger.artemis.io;
    
    import java.io.File;
    import java.io.IOException;
    import java.io.Writer;
    import java.util.Iterator;
    
    
    tjc's avatar
    tjc committed
    import javax.swing.JOptionPane;
    
    
    tjc's avatar
    tjc committed
    import net.sf.picard.reference.FastaSequenceIndex;
    import net.sf.picard.reference.IndexedFastaSequenceFile;
    import net.sf.picard.reference.ReferenceSequence;
    
    tjc's avatar
    tjc committed
    import net.sf.picard.reference.ReferenceSequenceFileFactory;
    
    tjc's avatar
    tjc committed
    
    
    tjc's avatar
    tjc committed
    import uk.ac.sanger.artemis.io.Entry;
    import uk.ac.sanger.artemis.Options;
    import uk.ac.sanger.artemis.components.EntryFileDialog;
    
    tjc's avatar
    tjc committed
    import uk.ac.sanger.artemis.util.FileDocument;
    
    import uk.ac.sanger.artemis.util.ReadOnlyException;
    
    tjc's avatar
    tjc committed
    import uk.ac.sanger.artemis.util.URLDocument;
    
    tjc's avatar
    tjc committed
    
    public class IndexFastaStream extends StreamSequence 
    {
      private IndexedFastaSequenceFile indexSeqFile;
      private FastaSequenceIndex fastaIndex;
      private int len;
      private String contig;
      
      public IndexFastaStream(Entry entry)
      {
    
    tjc's avatar
    tjc committed
        DocumentEntry doc = (DocumentEntry)entry;
        if(doc instanceof URLDocument)
        {
          //URL url = (URL)((URLDocument)doc).getLocation();
          // not supported yet
        }
        else
        {
          File fasta = ((FileDocument)doc.getDocument()).getFile();
          File fastaIndexFile = new File(fasta.getParentFile().getAbsolutePath(), fasta.getName()+".fai");
          fastaIndex = new FastaSequenceIndex(fastaIndexFile);
    
    tjc's avatar
    tjc committed
          
          try
          {
            indexSeqFile = new IndexedFastaSequenceFile(fasta, fastaIndex);
          }
          catch(IllegalArgumentException ie)
          {
            JOptionPane.showConfirmDialog(null, 
                "Expecting fasta extensions:\n"+
                ReferenceSequenceFileFactory.FASTA_EXTENSIONS.toString()+
                "\n"+ie.getMessage(), 
                "Error", JOptionPane.ERROR_MESSAGE);
          }
    
    tjc's avatar
    tjc committed
        }
        
    
    tjc's avatar
    tjc committed
        setContigByIndex(0);
      }
      
      /**
       * Test if the entry contains an indexed sequence
       * @param entry
       * @return
       */
      public static boolean isIndexed(Entry entry)
      {
        if( entry instanceof DocumentEntry && 
            ((DocumentEntry)entry).getDocument() instanceof FileDocument)
        {
          File fasta = ((FileDocument)((DocumentEntry)entry).getDocument()).getFile();
          File fastaIndexFile = new File(fasta.getParentFile().getAbsolutePath(), fasta.getName()+".fai");
          if(fastaIndexFile.exists())
            return true;
        }
        return false;
      }
      
      public void setContigByIndex(int seqIndex) 
      {
        /*ReferenceSequence ref = getReferenceSequence(seqIndex);
        len = ref.length();
        contig = ref.getName();*/
        
        len = getLengthByIndex(seqIndex);
        contig = getContigByIndex(seqIndex);
      }
    
      /**
       *  Return a the given range of bases as a String.  Returns an empty
       *  sequence if the end position is less than the start position.
       *  @param start The start base of the range.
       *  @param end The end base of the range.
       **/
      public String getSubSequence(int start, int end) 
      {
    
    tjc's avatar
    tjc committed
        byte b[] = indexSeqFile.getSubsequenceAt(contig, start, end).getBases();
        return new String(b).toLowerCase();
    
    tjc's avatar
    tjc committed
      }
      
      public char[] getCharSubSequence(int start, int end) 
      {
        return getSubSequence(start, end).toCharArray();
      }
      
      private int getLengthByIndex(int seqIndex)
      {
        Iterator it = fastaIndex.iterator();
        int i = 0;
        while(it.hasNext())
        {
          Object obj = it.next();
          if(i == seqIndex)
          {
            String size = obj.toString().split(";")[2].substring(5).trim();
            return Integer.parseInt(size);
          }
          i++;
        }
        return -1;
      }
      
      private String getContigByIndex(int seqIndex)
      {
        Iterator it = fastaIndex.iterator();
        int i = 0;
        while(it.hasNext())
        {
          Object obj = it.next();
          if(i == seqIndex)
            return obj.toString().split(";")[0].substring(6).trim();
          i++;
        }
        return null;
      }
      
      public ReferenceSequence getReferenceSequence(int seqIndex)
      {
        int i = 0;
        ReferenceSequence ref;
        indexSeqFile.reset();
        while( (ref=indexSeqFile.nextSequence()) != null ) 
        {  
          if(i == seqIndex)
            return ref;
           i++;
        }
        return null;
      }
      
    
      /**
       *  Returns the length of the sequence in bases.
       **/
      public int length() 
      {
        return len;
      }
      
      @Override
      public StreamSequence copy()
      {
        // TODO Auto-generated method stub
        return null;
      }
    
      @Override
      public int getFormatType()
      {
        return StreamSequenceFactory.INDEXED_FASTA_FORMAT;
      }
    
      
      public void setFromChar(final char dna[])
      {
        JOptionPane.showMessageDialog(null,"Read only sequence.", 
            "Warning", JOptionPane.WARNING_MESSAGE);
        throw new RuntimeException(new ReadOnlyException());
      }
    
    tjc's avatar
    tjc committed
    
      @Override
      public void writeToStream(Writer writer) throws IOException
      {
        // TODO Auto-generated method stub
      }
      
      public IndexedFastaSequenceFile getIndexSeqFile()
      {
        return indexSeqFile;
      }
      
      public FastaSequenceIndex getFastaIndex()
      {
        return fastaIndex;
      }
    
    tjc's avatar
    tjc committed
      
      public static void main(String args[])
      {
        EntryInformation new_entry_information =
          new SimpleEntryInformation(Options.getArtemisEntryInformation());
    
        try
        {
          Entry emblEntry = null;
          if(args[0].startsWith("http:"))
          {
            
            
          }
          else
          {
            final uk.ac.sanger.artemis.Entry entry =  
              new uk.ac.sanger.artemis.Entry(EntryFileDialog.getEntryFromFile(
                        null, new FileDocument(new File(args[0])),
                        new_entry_information, true));
            emblEntry = entry.getEMBLEntry();
          }
          
          IndexFastaStream istream = new IndexFastaStream(emblEntry);
          System.out.println(istream.getCharSubSequence(1, 8000));
        }
        catch (Exception e)
        {
          e.printStackTrace();
        }
      }
    
    tjc's avatar
    tjc committed
    }