001/* 002 * BioJava development code 003 * 004 * This code may be freely distributed and modified under the 005 * terms of the GNU Lesser General Public Licence. This should 006 * be distributed with the code. If you do not have a copy, 007 * see: 008 * 009 * http://www.gnu.org/copyleft/lesser.html 010 * 011 * Copyright for this code is held jointly by the individual 012 * authors. These should be listed in @author doc comments. 013 * 014 * For more information on the BioJava project and its aims, 015 * or to join the biojava-l mailing list, visit the home page 016 * at: 017 * 018 * http://www.biojava.org/ 019 * 020 */ 021package org.biojava.nbio.genome.homology; 022 023import org.biojava.nbio.genome.query.BlastXMLQuery; 024 025import java.io.File; 026import java.util.ArrayList; 027import java.util.LinkedHashMap; 028 029/** 030 * 031 * @author Scooter Willis 032 */ 033public class BlastHomologyHits { 034 035 static public LinkedHashMap<String, ArrayList<String>> getMatches(File xmlBlastHits, double ecutoff) throws Exception { 036 LinkedHashMap<String, ArrayList<String>> homologyHits = new LinkedHashMap<>(); 037 BlastXMLQuery blastXMLQuery = new BlastXMLQuery(xmlBlastHits.getAbsolutePath()); 038 LinkedHashMap<String, ArrayList<String>> hits = blastXMLQuery.getHitsQueryDef(ecutoff); 039 for (String accessionid : hits.keySet()) { 040 String[] data = accessionid.split(" "); // deal with notes/comments in blast results 041 String id = data[0]; 042 ArrayList<String> uniprotProteinHits = hits.get(accessionid); 043 homologyHits.put(id, uniprotProteinHits); 044 045 } 046 return homologyHits; 047 } 048}