001/** 002 * BioJava development code 003 * 004 * This code may be freely distributed and modified under the terms of the GNU 005 * Lesser General Public Licence. This should be distributed with the code. If 006 * you do not have a copy, see: 007 * 008 * http://www.gnu.org/copyleft/lesser.html 009 * 010 * Copyright for this code is held jointly by the individual authors. These 011 * should be listed in @author doc comments. 012 * 013 * For more information on the BioJava project and its aims, or to join the 014 * biojava-l mailing list, visit the home page at: 015 * 016 * http://www.biojava.org/ 017 * 018 * Created on Feb 23, 2012 Created by Andreas Prlic 019 * 020 * @since 3.0.2 021 */ 022package org.biojava.nbio.core.util; 023 024import java.io.File; 025import java.io.FileInputStream; 026import java.io.FileOutputStream; 027import java.io.IOException; 028import java.io.InputStream; 029import java.net.HttpURLConnection; 030import java.net.SocketTimeoutException; 031import java.net.URL; 032import java.net.URLConnection; 033import java.nio.channels.Channels; 034import java.nio.channels.FileChannel; 035import java.nio.channels.ReadableByteChannel; 036import java.nio.file.FileVisitResult; 037import java.nio.file.Files; 038import java.nio.file.Path; 039import java.nio.file.Paths; 040import java.nio.file.SimpleFileVisitor; 041import java.nio.file.attribute.BasicFileAttributes; 042 043import org.slf4j.Logger; 044import org.slf4j.LoggerFactory; 045 046public class FileDownloadUtils { 047 048 private static final Logger logger = LoggerFactory.getLogger(FileDownloadUtils.class); 049 050 /** 051 * Copy the content of file src to dst TODO since java 1.7 this is provided 052 * in java.nio.file.Files 053 * 054 * @param src 055 * @param dst 056 * @throws IOException 057 */ 058 @SuppressWarnings("resource") 059 public static void copy(File src, File dst) throws IOException { 060 061 // Took following recipe from 062 // http://stackoverflow.com/questions/106770/standard-concise-way-to-copy-a-file-in-java 063 // The nio package seems to be the most efficient way to copy a file 064 FileChannel source = null; 065 FileChannel destination = null; 066 067 try { 068 // we need the supress warnings here (the warning that the stream is not closed is harmless) 069 // see http://stackoverflow.com/questions/12970407/does-filechannel-close-close-the-underlying-stream 070 source = new FileInputStream(src).getChannel(); 071 destination = new FileOutputStream(dst).getChannel(); 072 destination.transferFrom(source, 0, source.size()); 073 } finally { 074 if (source != null) { 075 source.close(); 076 } 077 if (destination != null) { 078 destination.close(); 079 } 080 } 081 } 082 083 /** 084 * Gets the file extension of a file, excluding '.'. 085 * If the file name has no extension the file name is returned. 086 * @param f a File 087 * @return The extension 088 */ 089 public static String getFileExtension(File f) { 090 String fileName = f.getName(); 091 String ext = ""; 092 int mid = fileName.lastIndexOf("."); 093 ext = fileName.substring(mid + 1, fileName.length()); 094 return ext; 095 } 096 097 /** 098 * Gets the file name up to and excluding the first 099 * '.' character. If there is no extension, the full filename 100 * is returned. 101 * @param f A file 102 * @return A possibly empty but non-null String. 103 */ 104 public static String getFilePrefix(File f) { 105 String fileName = f.getName(); 106 int mid = fileName.indexOf("."); 107 if (mid < 0) { 108 return fileName; 109 } 110 return fileName.substring(0, mid); 111 } 112 113 /** 114 * Download the content provided at URL url and store the result to a local 115 * file, using a temp file to cache the content in case something goes wrong 116 * in download. A timeout of 60 seconds is hard-coded and 10 retries are attempted. 117 * 118 * @param url 119 * @param destination 120 * @throws IOException 121 */ 122 public static void downloadFile(URL url, File destination) throws IOException { 123 int count = 0; 124 int maxTries = 10; 125 int timeout = 60000; //60 sec 126 127 File tempFile = File.createTempFile(getFilePrefix(destination), "." + getFileExtension(destination)); 128 129 // Took following recipe from stackoverflow: 130 // http://stackoverflow.com/questions/921262/how-to-download-and-save-a-file-from-internet-using-java 131 // It seems to be the most efficient way to transfer a file 132 // See: http://docs.oracle.com/javase/7/docs/api/java/nio/channels/FileChannel.html 133 ReadableByteChannel rbc = null; 134 FileOutputStream fos = null; 135 while (true) { 136 try { 137 URLConnection connection = prepareURLConnection(url.toString(), timeout); 138 connection.connect(); 139 InputStream inputStream = connection.getInputStream(); 140 141 rbc = Channels.newChannel(inputStream); 142 fos = new FileOutputStream(tempFile); 143 fos.getChannel().transferFrom(rbc, 0, Long.MAX_VALUE); 144 break; 145 } catch (SocketTimeoutException e) { 146 if (++count == maxTries) throw e; 147 } finally { 148 if (rbc != null) { 149 rbc.close(); 150 } 151 if (fos != null) { 152 fos.close(); 153 } 154 } 155 } 156 157 logger.debug("Copying temp file {} to final location {}", tempFile, destination); 158 copy(tempFile, destination); 159 160 // delete the tmp file 161 tempFile.delete(); 162 163 } 164 165 /** 166 * Converts path to Unix convention and adds a terminating slash if it was 167 * omitted. 168 * 169 * @param path original platform dependent path 170 * @return path in Unix convention 171 * @author Peter Rose 172 * @since 3.2 173 */ 174 public static String toUnixPath(String path) { 175 String uPath = path; 176 if (uPath.contains("\\")) { 177 uPath = uPath.replaceAll("\\\\", "/"); 178 } 179 // this should be removed, it's need since "\" is added AtomCache code 180 if (uPath.endsWith("//")) { 181 uPath = uPath.substring(0, uPath.length() - 1); 182 } 183 if (!uPath.endsWith("/")) { 184 uPath = uPath + "/"; 185 } 186 return uPath; 187 } 188 189 /** 190 * Expands ~ in paths to the user's home directory. 191 * 192 * <p> 193 * This does not work for some special cases for paths: Other users' homes 194 * (~user/...), and Tilde expansion within the path (/.../~/...). In these cases 195 * the original argument is returned. 196 * 197 * @param file A filepath starting with a tilde 198 * @return An absolute path 199 */ 200 public static String expandUserHome(String file) { 201 // replace any / with the proper separator (/ or \ for Linux and Windows respectively). 202 file = file.replaceAll("/", "\\"+File.separator); //The "\\" is to escape the separator if needed. 203 if (file.startsWith("~" + File.separator)) { 204 file = System.getProperty("user.home") + file.substring(1); 205 } 206 return file; 207 } 208 209 /** 210 * Pings a HTTP URL. This effectively sends a HEAD request and returns 211 * <code>true</code> if the response code is in the 200-399 range. 212 * 213 * @param url The HTTP URL to be pinged. 214 * @param timeout The timeout in millis for both the connection timeout and 215 * the response read timeout. Note that the total timeout is effectively two 216 * times the given timeout. 217 * @return <code>true</code> if the given HTTP URL has returned response 218 * code 200-399 on a HEAD request within the given timeout, otherwise 219 * <code>false</code>. 220 * @author BalusC, 221 * http://stackoverflow.com/questions/3584210/preferred-java-way-to-ping-a-http-url-for-availability 222 */ 223 public static boolean ping(String url, int timeout) { 224 //url = url.replaceFirst("https", "http"); // Otherwise an exception may be thrown on invalid SSL certificates. 225 226 try { 227 HttpURLConnection connection = (HttpURLConnection) prepareURLConnection(url, timeout); 228 connection.setRequestMethod("HEAD"); 229 int responseCode = connection.getResponseCode(); 230 return (200 <= responseCode && responseCode <= 399); 231 } catch (IOException exception) { 232 return false; 233 } 234 } 235 236 /** 237 * Prepare {@link URLConnection} with customised timeouts. 238 * 239 * @param url The URL 240 * @param timeout The timeout in millis for both the connection timeout and 241 * the response read timeout. Note that the total timeout is effectively two 242 * times the given timeout. 243 * 244 * <p> 245 * Example of code. <code> 246 * UrlConnection conn = prepareURLConnection("http://www.google.com/", 20000); 247 * conn.connect(); 248 * conn.getInputStream(); 249 * </code> 250 * <p> 251 * 252 * <bold>NB. User should execute connect() method before getting input 253 * stream.</bold> 254 * @return 255 * @throws IOException 256 * @author Jacek Grzebyta 257 */ 258 public static URLConnection prepareURLConnection(String url, int timeout) throws IOException { 259 URLConnection connection = new URL(url).openConnection(); 260 connection.setReadTimeout(timeout); 261 connection.setConnectTimeout(timeout); 262 return connection; 263 } 264 265 /** 266 * Recursively delete a folder & contents 267 * 268 * @param dir directory to delete 269 */ 270 public static void deleteDirectory(Path dir) throws IOException { 271 if(dir == null || !Files.exists(dir)) 272 return; 273 Files.walkFileTree(dir, new SimpleFileVisitor<Path>() { 274 @Override 275 public FileVisitResult visitFile(Path file, BasicFileAttributes attrs) throws IOException { 276 Files.delete(file); 277 return FileVisitResult.CONTINUE; 278 } 279 280 @Override 281 public FileVisitResult postVisitDirectory(Path dir, IOException e) throws IOException { 282 if (e != null) { 283 throw e; 284 } 285 Files.delete(dir); 286 return FileVisitResult.CONTINUE; 287 } 288 }); 289 } 290 /** 291 * Recursively delete a folder & contents 292 * 293 * @param dir directory to delete 294 */ 295 public static void deleteDirectory(String dir) throws IOException { 296 deleteDirectory(Paths.get(dir)); 297 } 298 299 300 public static void main(String[] args) { 301 String url; 302 url = "http://scop.mrc-lmb.cam.ac.uk/scop/parse/"; 303 System.out.format("%s\t%s%n", ping(url, 200), url); 304 url = "http://scop.mrc-lmb.cam.ac.uk/scop/parse/foo"; 305 System.out.format("%s\t%s%n", ping(url, 200), url); 306 url = "http://scopzzz.mrc-lmb.cam.ac.uk/scop/parse/"; 307 System.out.format("%s\t%s%n", ping(url, 200), url); 308 url = "scop.mrc-lmb.cam.ac.uk"; 309 System.out.format("%s\t%s%n", ping(url, 200), url); 310 url = "http://scop.mrc-lmb.cam.ac.uk"; 311 System.out.format("%s\t%s%n", ping(url, 200), url); 312 } 313 314}