001/**
002 *                    BioJava development code
003 *
004 * This code may be freely distributed and modified under the
005 * terms of the GNU Lesser General Public Licence.  This should
006 * be distributed with the code.  If you do not have a copy,
007 * see:
008 *
009 *      http://www.gnu.org/copyleft/lesser.html
010 *
011 * Copyright for this code is held jointly by the individual
012 * authors.  These should be listed in @author doc comments.
013 *
014 * For more information on the BioJava project and its aims,
015 * or to join the biojava-l mailing list, visit the home page
016 * at:
017 *
018 *      http://www.biojava.org/
019 *
020 * Created on Feb 22, 2012
021 * Created by Andreas Prlic
022 *
023 * @since 3.0.2
024 */
025package org.biojava.nbio.structure.io.sifts;
026
027import org.biojava.nbio.structure.align.util.AtomCache;
028import org.biojava.nbio.core.util.FileDownloadUtils;
029import org.biojava.nbio.core.util.InputStreamProvider;
030import org.slf4j.Logger;
031import org.slf4j.LoggerFactory;
032
033import java.io.File;
034import java.io.IOException;
035import java.io.InputStream;
036import java.net.URL;
037import java.util.List;
038
039public class SiftsMappingProvider {
040
041        private final static Logger logger = LoggerFactory.getLogger(SiftsMappingProvider.class);
042
043
044        private static final String EBI_SIFTS_FILE_LOCATION = "https://ftp.ebi.ac.uk/pub/databases/msd/sifts/xml/%s.xml.gz";
045
046        private static String fileLoc = EBI_SIFTS_FILE_LOCATION;
047
048        public static void setFileLocation(String myFileLocation){
049                fileLoc = myFileLocation;
050        }
051
052        /**
053         * Return the SIFTS mappings by getting the info from individual SIFTS xml files at URL {@value EBI_SIFTS_FILE_LOCATION}
054         * @param pdbId the pdb identifier
055         * @return
056         * @throws IOException if problems downloading or parsing the file
057         */
058        public static List<SiftsEntity> getSiftsMapping(String pdbId) throws IOException{
059                // grab files from here:
060
061                AtomCache cache = new AtomCache();
062
063                String path = cache.getCachePath();
064
065                pdbId = pdbId.toLowerCase();
066
067                String dirHash = pdbId.substring(1,3);
068                File siftsDir = new File(path , "SIFTS");
069
070
071                if ( ! siftsDir.exists()) {
072                        logger.info("Creating directory {}", siftsDir.toString());
073                        siftsDir.mkdir();
074                }
075
076                File hashDir = new File(siftsDir, dirHash);
077
078                if ( ! hashDir.exists()){
079                        logger.info("Creating directory {}", hashDir.toString());
080                        hashDir.mkdir();
081                }
082                File dest = new File( hashDir, pdbId + ".sifts.xml.gz");
083
084                logger.debug("testing SIFTS file {}", dest.getAbsolutePath());
085
086
087                if ( ! dest.exists()){
088                        String u = String.format(fileLoc,pdbId);
089                        URL url = new URL(u);
090                        logger.debug("Downloading SIFTS file {} validation metadata.",url);
091                        FileDownloadUtils.createValidationFiles(url, dest, null, FileDownloadUtils.Hash.UNKNOWN);
092                        logger.debug("Downloading SIFTS file {} to {}",url,dest);
093                        FileDownloadUtils.downloadFile(url, dest);
094                }
095
096                if(! FileDownloadUtils.validateFile(dest))
097                        throw new IOException("Downloaded file invalid: "+dest);
098
099                InputStreamProvider prov = new InputStreamProvider();
100                InputStream is = prov.getInputStream(dest);
101                SiftsXMLParser parser = new SiftsXMLParser();
102
103                parser.parseXmlFile(is);
104
105                //System.out.println(parser.getEntities());
106                return parser.getEntities();
107
108
109        }
110
111
112}