001/* 002 * BioJava development code 003 * 004 * This code may be freely distributed and modified under the 005 * terms of the GNU Lesser General Public Licence. This should 006 * be distributed with the code. If you do not have a copy, 007 * see: 008 * 009 * http://www.gnu.org/copyleft/lesser.html 010 * 011 * Copyright for this code is held jointly by the individual 012 * authors. These should be listed in @author doc comments. 013 * 014 * For more information on the BioJava project and its aims, 015 * or to join the biojava-l mailing list, visit the home page 016 * at: 017 * 018 * http://www.biojava.org/ 019 * 020 */ 021package org.biojava.nbio.structure.quaternary; 022 023import org.biojava.nbio.structure.*; 024 025import java.util.ArrayList; 026import java.util.Arrays; 027import java.util.List; 028 029import javax.vecmath.Point3d; 030 031 032 033 034 035/** 036 * @author Peter Rose 037 * 038 * 039 */ 040public class BioAssemblyTools { 041 042 043 /** 044 * Checks if the passed in expression is a unary operator expression 045 * Example: (1,2,3) or (1-60) are unary operator expressions 046 * (1-60)(61-88) is a binary operator expression, representing 047 * a cartesian product of the two parenthesised lists 048 * 049 * @param expression 050 * @return true if expression is a unary operator expression 051 */ 052 public static boolean isUnaryExpression(String expression) { 053 int first = expression.indexOf("("); 054 int last = expression.lastIndexOf("("); 055 if (first < 0 || last < 0) { 056 return true; 057 } 058 return ! (first == 0 && last > first); 059 } 060 061 public static List<String> parseUnaryOperatorExpression(String operatorExpression) { 062 return parseSubExpression(operatorExpression); 063 } 064 065 private static List<String> parseSubExpression(String expression) { 066 // remove parenthesis, if any 067 String tmp = expression.replace("(", ""); 068 tmp = tmp.replace(")", ""); 069 070 // separate the operators 071 List<String> components = null; 072 try { 073 components = Arrays.asList(tmp.split(",")); 074 } catch (Exception e) { 075 throw new IllegalArgumentException("Invalid oper_expression: " + expression); 076 } 077 078 // expand ranges if present, i.e. 1-60 -> 1, 2, 3, ..., 60 079 List<String> operators = new ArrayList<>(); 080 for (String component : components) { 081 if (component.contains("-")) { 082 operators.addAll(expandRange(component)); 083 } else { 084 operators.add(component); 085 } 086 } 087 return operators; 088 } 089 090 /** 091 * Expands a range expression, i.e. (1-6) to a list 1,2,3,4,5,6 092 * @param expression the expression to be expanded 093 * @return list of items in range 094 * @throws IllegalArgumentException 095 */ 096 private static List<String> expandRange(String expression) { 097 int first = 0; 098 int last = 0; 099 try { 100 String[] range = expression.split("-"); 101 first = Integer.parseInt(range[0]); 102 last = Integer.parseInt(range[1]); 103 } catch (Exception e) { 104 throw new IllegalArgumentException("Invalid range specification in oper_expression: " + expression); 105 } 106 107 List<String> expandedExpression = new ArrayList<>(last-first+1); 108 for (int i = first; i <= last; i++) { 109 expandedExpression.add(String.valueOf(i)); 110 } 111 return expandedExpression; 112 } 113 114 public static List<OrderedPair<String>> parseBinaryOperatorExpression(String expression) 115 { 116 // split operator expression, i.e. (1,2,3)(4,5) into two subexpressions 117 String[] subExpressions = null; 118 try { 119 subExpressions = expression.split("\\)\\("); 120 } catch (Exception e) { 121 throw new IllegalArgumentException("Invalid oper_expression: " + expression); 122 } 123 if (subExpressions.length != 2) { 124 throw new IllegalArgumentException("Invalid oper_expression: " + expression); 125 } 126 List<String> leftSide = parseSubExpression(subExpressions[0]); 127 List<String> rightSide = parseSubExpression(subExpressions[1]); 128 129 // form the cartesian product of the two lists 130 CartesianProduct<String> product = new CartesianProduct<>(leftSide, rightSide); 131 return product.getOrderedPairs(); 132 } 133 134 public static double[][] getBiologicalMoleculeBounds(Structure asymStructure,List<BiologicalAssemblyTransformation> transformations) { 135 final double[][] coordinateBounds = new double[2][3]; 136 coordinateBounds[0][0] = Double.MAX_VALUE; // min x 137 coordinateBounds[0][1] = Double.MAX_VALUE; // min y 138 coordinateBounds[0][2] = Double.MAX_VALUE; // min z 139 coordinateBounds[1][0] = Double.MIN_VALUE; // max x 140 coordinateBounds[1][1] = Double.MIN_VALUE; // max y 141 coordinateBounds[1][2] = Double.MIN_VALUE; // max z 142 143 double[] transformedCoords = new double[3]; 144 145 Atom[] atoms = StructureTools.getAllAtomArray(asymStructure); 146 147 for ( Atom a : atoms) { 148 149 Chain c = a.getGroup().getChain(); 150 String intChainID = c.getId(); 151 152 for (BiologicalAssemblyTransformation m: transformations) { 153 if ( ! m.getChainId().equals(intChainID)) 154 continue; 155 Point3d coords = a.getCoordsAsPoint3d(); 156 transformedCoords[0] = coords.x; 157 transformedCoords[1] = coords.y; 158 transformedCoords[2] = coords.z; 159 160 if (transformedCoords[0] < coordinateBounds[0][0] ) { 161 coordinateBounds[0][0] = transformedCoords[0]; // min x 162 } 163 164 if (transformedCoords[1] < coordinateBounds[0][1] ) { 165 coordinateBounds[0][1] = transformedCoords[1]; // min y 166 } 167 168 if (transformedCoords[2] < coordinateBounds[0][2] ) { 169 coordinateBounds[0][2] = transformedCoords[2]; // min z 170 } 171 172 if (transformedCoords[0] > coordinateBounds[1][0] ) { 173 coordinateBounds[1][0] = transformedCoords[0]; // max x 174 } 175 176 if (transformedCoords[1] > coordinateBounds[1][1] ) { 177 coordinateBounds[1][1] = transformedCoords[1]; // max y 178 } 179 180 if (transformedCoords[2] > coordinateBounds[1][2] ) { 181 coordinateBounds[1][2] = transformedCoords[2]; // max z 182 } 183 } 184 } 185 return coordinateBounds; 186 } 187 public static double[][] getAtomCoordinateBounds(Structure s){ 188 189 Atom[] atoms = StructureTools.getAllAtomArray(s); 190 int atomCount = atoms.length; 191 final double[][] coordinateBounds = new double[2][3]; 192 if ( atomCount <= 0 ) { 193 return coordinateBounds; 194 } 195 196 Atom a = atoms[0]; 197 198 coordinateBounds[0][0] = a.getX(); // min x 199 coordinateBounds[0][1] = a.getY(); // min y 200 coordinateBounds[0][2] = a.getZ(); // min z 201 coordinateBounds[1][0] = a.getX(); // max x 202 coordinateBounds[1][1] = a.getY(); // max y 203 coordinateBounds[1][2] = a.getZ(); // max z 204 205 for ( int i=1; i<atomCount; i++ ) 206 { 207 a =atoms[i]; 208 209 if ( a.getX() < coordinateBounds[0][0] ) { 210 coordinateBounds[0][0] = a.getX(); // min x 211 } 212 213 if ( a.getY() < coordinateBounds[0][1] ) { 214 coordinateBounds[0][1] = a.getY(); // min y 215 } 216 217 if ( a.getZ() < coordinateBounds[0][2] ) { 218 coordinateBounds[0][2] = a.getZ(); // min z 219 } 220 221 if ( a.getX() > coordinateBounds[1][0] ) { 222 coordinateBounds[1][0] = a.getX(); // max x 223 } 224 225 if ( a.getY() > coordinateBounds[1][1] ) { 226 coordinateBounds[1][1] = a.getY(); // max y 227 } 228 229 if ( a.getZ() > coordinateBounds[1][2] ) { 230 coordinateBounds[1][2] = a.getZ(); // max z 231 } 232 } 233 234 return coordinateBounds; 235 } 236 237 /** 238 * Returns the maximum extend of the structure in the x, y, or z direction. 239 * @param structure 240 * @return maximum extend 241 */ 242 public static double getMaximumExtend( final Structure structure ) { 243 double[][] bounds = getAtomCoordinateBounds(structure); 244 double xMax = Math.abs(bounds[0][0] - bounds[1][0]); 245 double yMax = Math.abs(bounds[0][1] - bounds[1][1]); 246 double zMax = Math.abs(bounds[0][2] - bounds[1][2]); 247 return Math.max(xMax, Math.max(yMax, zMax)); 248 } 249 250 /** 251 * Returns the maximum extend of the biological molecule in the x, y, or z direction. 252 * @param structure 253 * @return maximum extend 254 */ 255 public static double getBiologicalMoleculeMaximumExtend( final Structure structure,List<BiologicalAssemblyTransformation> transformations ) { 256 double[][] bounds = getBiologicalMoleculeBounds(structure, transformations); 257 double xMax = Math.abs(bounds[0][0] - bounds[1][0]); 258 double yMax = Math.abs(bounds[0][1] - bounds[1][1]); 259 double zMax = Math.abs(bounds[0][2] - bounds[1][2]); 260 return Math.max(xMax, Math.max(yMax, zMax)); 261 } 262 263 /** 264 * Returns the centroid of the biological molecule. 265 * @param asymUnit 266 * @return centroid 267 * @throws IllegalArgumentException if structure is null 268 */ 269 public static double[] getBiologicalMoleculeCentroid( final Structure asymUnit, List<BiologicalAssemblyTransformation> transformations ) { 270 if ( asymUnit == null ) { 271 throw new IllegalArgumentException( "null structure" ); 272 } 273 274 Atom[] atoms = StructureTools.getAllAtomArray(asymUnit); 275 int atomCount = atoms.length; 276 double[] centroid = new double[3]; 277 278 if ( atomCount <= 0 ) { 279 return centroid; 280 } 281 282 if ( transformations.size() == 0) { 283 return Calc.getCentroid(atoms).getCoords(); 284 285 } 286 287 288 289 int count = 0; 290 double[] transformedCoordinate = new double[3]; 291 292 for (int i = 0; i < atomCount; i++) 293 { 294 Atom atom = atoms[i]; 295 Chain chain = atom.getGroup().getChain(); 296 String intChainID = chain.getId(); 297 298 299 for (BiologicalAssemblyTransformation m: transformations) { 300 if (! m.getChainId().equals(intChainID)) 301 continue; 302 303 Point3d coords = atom.getCoordsAsPoint3d(); 304 transformedCoordinate[0] = coords.x; 305 transformedCoordinate[1] = coords.y; 306 transformedCoordinate[2] = coords.z; 307 m.transformPoint(transformedCoordinate); 308 centroid[0] += transformedCoordinate[0]; 309 centroid[1] += transformedCoordinate[1]; 310 centroid[2] += transformedCoordinate[2]; 311 count++; 312 } 313 } 314 315 316 317 centroid[0] /= count; 318 centroid[1] /= count; 319 centroid[2] /= count; 320 321 return centroid; 322 } 323 324 /** 325 * Reduce a structure to a single-atom representation (e.g. CA atoms) 326 * 327 * @param orig 328 * @return 329 * @since Biojava 4.1.0 330 */ 331 public static Structure getReducedStructure(Structure orig){ 332 Structure s = new StructureImpl(); 333 s.setPDBHeader(orig.getPDBHeader()); 334 for ( Chain c : orig.getChains()){ 335 336 Chain c1 = new ChainImpl(); 337 c1.setId(c.getId()); 338 c1.setName(c.getName()); 339 c1.setEntityInfo(c.getEntityInfo()); 340 s.addChain(c1); 341 342 for (Group g : c.getAtomGroups()){ 343 344 Atom a = null; 345 switch(g.getType()) { 346 case AMINOACID: 347 a = g.getAtom(StructureTools.CA_ATOM_NAME); 348 break; 349 case NUCLEOTIDE: 350 a = g.getAtom(StructureTools.NUCLEOTIDE_REPRESENTATIVE); 351 break; 352 default: 353 //omit group 354 } 355 if ( a != null){ 356 357 Group g1 = (Group)g.clone(); 358 g1.clearAtoms(); 359 g1.addAtom(a); 360 c1.addGroup(g1); 361 362 } 363 364 } 365 366 } 367 return s; 368 } 369 370}