001/* 002 * BioJava development code 003 * 004 * This code may be freely distributed and modified under the 005 * terms of the GNU Lesser General Public Licence. This should 006 * be distributed with the code. If you do not have a copy, 007 * see: 008 * 009 * http://www.gnu.org/copyleft/lesser.html 010 * 011 * Copyright for this code is held jointly by the individual 012 * authors. These should be listed in @author doc comments. 013 * 014 * For more information on the BioJava project and its aims, 015 * or to join the biojava-l mailing list, visit the home page 016 * at: 017 * 018 * http://www.biojava.org/ 019 * 020 */ 021package org.biojava.nbio.structure.secstruc; 022 023import org.biojava.nbio.structure.*; 024import org.biojava.nbio.structure.contact.AtomContact; 025import org.biojava.nbio.structure.contact.AtomContactSet; 026import org.biojava.nbio.structure.contact.Grid; 027import org.biojava.nbio.structure.contact.Pair; 028import org.slf4j.Logger; 029import org.slf4j.LoggerFactory; 030 031import java.util.ArrayList; 032import java.util.Arrays; 033import java.util.Collections; 034import java.util.Comparator; 035import java.util.HashMap; 036import java.util.Iterator; 037import java.util.List; 038import java.util.Map; 039 040/** 041 * Calculate and assign the secondary structure (SS) to the 042 * Groups of a Structure object. This object also stores the result 043 * of the calculation. 044 * <p> 045 * The rules for SS calculation are the ones defined by DSSP: 046 * Kabsch,W. and Sander,C. (1983) Biopolymers 22, 2577-2637. 047 * Original DSSP article see at: 048 * <a href="http://www.cmbi.kun.nl/gv/dssp/dssp.pdf">dssp.pdf</a>. 049 * Some parts are also taken from: T.E.Creighton, Proteins - 050 * Structure and Molecular Properties, 2nd Edition, Freeman 1994. 051 * 052 * @author Andreas Prlic 053 * @author Aleix Lafita 054 * @author Anthony Bradley 055 * 056 */ 057public class SecStrucCalc { 058 059 /** 060 * DSSP assigns helices one residue shorter at each end, because the 061 * residues at (i-1) and (i+n+1) are not assigned helix type although 062 * they contain a consistent turn (H-bond). If this parameter 063 * is true, the helices will be the length of the original DSSP 064 * convention. If it is false, they will be two residue longer. 065 */ 066 private static final boolean DSSP_HELICES = true; 067 068 private static final Logger logger = 069 LoggerFactory.getLogger(SecStrucCalc.class); 070 071 /** min distance between two residues */ 072 public static final double MINDIST = 0.5; 073 074 /** min distance of two CA atoms if H-bonds are allowed to form */ 075 public static final double CA_MIN_DIST = 9.0; 076 077 /** max distance CA atoms in peptide bond (backbone discontinuity) */ 078 public static final double MAX_PEPTIDE_BOND_LENGTH = 2.5; 079 080 /** Minimal H-bond energy in cal/mol */ 081 public static final int HBONDLOWENERGY = -9900; 082 083 /** higher limit for H-bond energy */ 084 public static final double HBONDHIGHENERGY = -500.0; 085 086 /** 087 * constant for electrostatic energy 088 * <pre> 089 * f * q1 * q2 * scale 090 * Q = -332 * 0.42 * 0.20 * 1000.0 091 *</pre> 092 * 093 * q1 and q2 are partial charges which are placed on the C,O 094 * (+q1,-q1) and N,H (-q2,+q2) 095 */ 096 public static final double Q = -27888.0; 097 098 // Three lists 099 private SecStrucGroup[] groups; 100 private List<Ladder> ladders; 101 private List<BetaBridge> bridges; 102 private Atom[] atoms; 103 // Added by Anthony - to speed up intergroup calculations 104 private AtomContactSet contactSet; 105 private Map<ResidueNumber, Integer> indResMap; 106 public SecStrucCalc(){ 107 ladders = new ArrayList<>(); 108 bridges = new ArrayList<>(); 109 } 110 111 112 /** 113 * Predicts the secondary structure of this Structure object, 114 * using a DSSP implementation. 115 * 116 * @param s Structure to predict the SS 117 * @param assign sets the SS information to the Groups of s 118 * @return a List of SS annotation objects 119 */ 120 public List<SecStrucState> calculate(Structure s, boolean assign) 121 throws StructureException { 122 123 List<SecStrucState> secstruc = new ArrayList<>(); 124 for(int i=0; i<s.nrModels(); i++) { 125 // Reinitialise the global vars 126 ladders = new ArrayList<>(); 127 bridges = new ArrayList<>(); 128 groups = initGroupArray(s, i); 129 // Initialise the contact set for this structure 130 initContactSet(); 131 if (groups.length < 5) { 132 // not enough groups to do anything 133 throw new StructureException("Not enough backbone groups in the" 134 + " Structure to calculate the secondary structure (" 135 + groups.length+" given, minimum 5)" ); 136 } 137 138 calculateHAtoms(); 139 calculateHBonds(); 140 calculateDihedralAngles(); 141 calculateTurns(); 142 buildHelices(); 143 detectBends(); 144 detectStrands(); 145 146 for (SecStrucGroup sg : groups){ 147 SecStrucState ss = (SecStrucState) 148 sg.getProperty(Group.SEC_STRUC); 149 // Add to return list and assign to original if flag is true 150 secstruc.add(ss); 151 if (assign) sg.getOriginal().setProperty(Group.SEC_STRUC, ss); 152 } 153 } 154 return secstruc; 155 } 156 157 /** 158 * Function to generate the contact sets 159 */ 160 private void initContactSet() { 161 162 // Initialise an array of atoms 163 atoms = new Atom[groups.length]; 164 // Remake this local var 165 indResMap = new HashMap<>(); 166 for (int i=0 ; i < groups.length ; i++){ 167 SecStrucGroup one = groups[i]; 168 indResMap.put(one.getResidueNumber(), i); 169 atoms[i] = one.getCA(); 170 } 171 Grid grid = new Grid(CA_MIN_DIST); 172 if(atoms.length==0){ 173 contactSet = new AtomContactSet(CA_MIN_DIST); 174 } 175 else{ 176 grid.addAtoms(atoms); 177 contactSet = grid.getAtomContacts(); 178 } 179 } 180 181 /** 182 * Updated code to detect strands 183 */ 184 private void detectStrands() { 185 186 //Find all the beta bridges of the structure 187 findBridges(); 188 //Create Ladders 189 createLadders(); 190 191 //Detect beta bulges between ladders 192 connectLadders(); 193 194 //AND store SS assignments for Sheets, Strands and Bridges 195 updateSheets(); 196 } 197 198 199 private void createLadders(){ 200 201 for (BetaBridge b : bridges){ 202 boolean found = false; 203 for (Ladder ladder : ladders){ 204 if (shouldExtendLadder(ladder, b)) { 205 found = true; 206 ladder.to++; //we go forward in this direction 207 switch(b.type){ 208 case parallel: 209 ladder.lto++; //increment second strand 210 break; 211 case antiparallel: 212 ladder.lfrom--; //decrement second strand 213 break; 214 } 215 break; 216 } 217 } 218 if (!found){ 219 //Create new ladder with a single Bridge 220 Ladder l = new Ladder(); 221 l.from = b.partner1; 222 l.to = b.partner1; 223 l.lfrom = b.partner2; 224 l.lto = b.partner2; 225 l.btype = b.type; 226 ladders.add(l); 227 } 228 } 229 } 230 231 232 private void updateSheets() { 233 234 logger.debug(" got {} ladders!", ladders.size()); 235 236 for (Ladder ladder : ladders){ 237 logger.debug(ladder.toString()); 238 239 for (int lcount = ladder.from; lcount <= ladder.to; lcount++) { 240 241 SecStrucState state = getSecStrucState(lcount); 242 SecStrucType stype = state.getType(); 243 244 int diff = ladder.from - lcount; 245 int l2count = ladder.lfrom - diff ; 246 247 SecStrucState state2 = getSecStrucState(l2count); 248 SecStrucType stype2 = state2.getType(); 249 250 if ( ladder.from != ladder.to ) { 251 setSecStrucType(lcount, SecStrucType.extended); 252 setSecStrucType(l2count, SecStrucType.extended); 253 } 254 else { 255 if ( !stype.isHelixType() && 256 ( !stype.equals(SecStrucType.extended))) 257 setSecStrucType(lcount,SecStrucType.bridge); 258 259 if ( ! stype2.isHelixType() && 260 (! stype2.equals(SecStrucType.extended))) 261 setSecStrucType(l2count,SecStrucType.bridge); 262 } 263 } 264 265 // Check if two ladders are connected. both sides are 'E' 266 267 if (ladder.connectedTo == 0) continue; 268 Ladder conladder = ladders.get(ladder.connectedTo); 269 270 if (ladder.btype.equals(BridgeType.antiparallel)) { 271 /* set one side */ 272 for (int lcount = ladder.from; lcount <= conladder.to; 273 lcount++) { 274 setSecStrucType(lcount, SecStrucType.extended); 275 276 } 277 /* set other side */ 278 for (int lcount = conladder.lto; 279 lcount <= ladder.lfrom; 280 lcount++) { 281 setSecStrucType(lcount, SecStrucType.extended); 282 } 283 284 } else { 285 /* set one side */ 286 for ( int lcount = ladder.from; 287 lcount <= conladder.to; 288 lcount++) { 289 290 setSecStrucType(lcount, SecStrucType.extended); 291 } 292 /* set other side */ 293 for ( int lcount = ladder.lfrom; 294 lcount <= conladder.lto; 295 lcount++) { 296 297 setSecStrucType(lcount, SecStrucType.extended); 298 } 299 } 300 } 301 } 302 303 private void connectLadders() { 304 305 for (int i = 0 ; i < ladders.size(); i++) { 306 for ( int j = i ; j < ladders.size(); j++){ 307 Ladder l1 = ladders.get(i); 308 Ladder l2 = ladders.get(j); 309 if (hasBulge(l1,l2)) { 310 l1.connectedTo = j; 311 l2.connectedFrom = i; 312 logger.debug("Bulge from {} to {}", i, j); 313 } 314 } 315 } 316 317 318 } 319 320 /** 321 * For beta structures, we define explicitly: a bulge-linked 322 * ladder consists of two (perfect) ladder or bridges of the 323 * same type connected by at most one extra residue on one 324 * strand and at most four extra residues on the other strand, 325 * all residues in bulge-linked ladders are marked "E," 326 * including the extra residues. 327 */ 328 private boolean hasBulge(Ladder l1, Ladder l2) { 329 330 boolean bulge = ((l1.btype.equals(l2.btype)) && 331 (l2.from - l1.to < 6) && 332 (l1.to < l2.from) && 333 (l2.connectedTo == 0)); 334 335 if (!bulge) return bulge; 336 337 switch(l1.btype){ 338 case parallel: 339 bulge = ( (l2.lfrom - l1.lto > 0) && 340 ((( l2.lfrom -l1.lto < 6) && 341 (l2.from - l1.to < 3)) || 342 ( l2.lfrom - l1.lto <3))); 343 344 break; 345 346 case antiparallel: 347 bulge = ( (l1.lfrom - l2.lto > 0) && 348 (((l1.lfrom -l2.lto < 6) && 349 ( l2.from - l1.to < 3)) || 350 (l1.lfrom - l2.lto < 3))); 351 352 break; 353 } 354 355 return bulge; 356 } 357 358 private void registerBridge(int i, int j, BridgeType btype) { 359 360 BetaBridge bridge = new BetaBridge(i,j,btype); 361 362 boolean b1 = getSecStrucState(i).addBridge(bridge); 363 boolean b2 = getSecStrucState(j).addBridge(bridge); 364 365 if (!b1 && !b2) 366 logger.warn("Ignoring Bridge between residues {} and {}. DSSP assignment might differ.", i, j); 367 368 bridges.add(bridge); 369 } 370 371 /** 372 * Conditions to extend a ladder with a given beta Bridge: 373 * <li>The bridge and ladder are of the same type. 374 * <li>The smallest bridge residue is sequential to the first 375 * strand ladder. 376 * <li>The second bridge residue is either sequential (parallel) 377 * or previous (antiparallel) to the second strand of the ladder 378 * </li> 379 * @param ladder the ladder candidate to extend 380 * @param b the beta bridge that would extend the ladder 381 * @return true if the bridge b extends the ladder 382 */ 383 private boolean shouldExtendLadder(Ladder ladder, BetaBridge b) { 384 385 //Only extend if they are of the same type 386 boolean sameType = b.type.equals(ladder.btype); 387 if (!sameType) return false; 388 389 //Only extend if residue 1 is sequential to ladder strand 390 boolean sequential = (b.partner1 == ladder.to+1); 391 if (!sequential) return false; 392 393 switch(b.type){ 394 case parallel: 395 //Residue 2 should be sequential to second strand 396 if (b.partner2 == ladder.lto+1) return true; 397 break; 398 case antiparallel: 399 //Residue 2 should be previous to second strand 400 if (b.partner2 == ladder.lfrom-1) return true; 401 break; 402 } 403 return false; 404 } 405 406 407 408 409 /** 410 * Two nonoverlapping stretches of three residues each, i-1,i,i+1 and 411 * j-1,j,j+1, form either a parallel or antiparallel bridge, depending on 412 * which of two basic patterns is matched. We assign a bridge between 413 * residues i and j if there are two H bonds characteristic of beta- 414 * structure; in particular: 415 * <p> 416 * Parallel Bridge(i,j) =: [Hbond(i-1,j) and Hbond(j,i+1)] 417 * or [Hbond(j-1,i) and Hbond(i,j+1)] 418 * <p> 419 * Antiparallel Bridge(i,j) =: [Hbond(i,j) and Hbond(j,i)] 420 * or [Hbond(i-1,j+1) and Hbond(j-1,i+1)] 421 * 422 * Optimised to use the contact set 423 */ 424 private void findBridges() { 425 // Get the interator of contacts 426 Iterator<AtomContact> myIter = contactSet.iterator(); 427 List<Pair<Integer>> outList = new ArrayList<>(); 428 429 // Now iterate through this 430 while(myIter.hasNext()){ 431 // Get the next atom contact 432 AtomContact ac = myIter.next(); 433 Group g1 = ac.getPair().getFirst().getGroup(); 434 Group g2 = ac.getPair().getSecond().getGroup(); 435 // Get the indices 436 int i = indResMap.get(g1.getResidueNumber()); 437 int j = indResMap.get(g2.getResidueNumber()); 438 // If i>j switch them over 439 if(i>j){ 440 // Switch them over 441 int old = i; 442 i = j; 443 j = old; 444 } 445 // Only these 446 if(j<i+3){ 447 continue; 448 } 449 // If it's the first 450 if(i==0){ 451 continue; 452 } 453 if(j==0){ 454 continue; 455 } 456 // If it's the last 457 if(i==groups.length-1){ 458 continue; 459 } 460 if(j==groups.length-1){ 461 continue; 462 } 463 464 Pair<Integer> thisPair = new Pair<>(i,j); 465 outList.add(thisPair); 466 } 467 // 468 Collections.sort(outList, new Comparator<Pair<Integer>>() { 469 @Override 470 public int compare(Pair<Integer> o1, Pair<Integer> o2) { 471 if(o1.getFirst()<o2.getFirst()){ 472 return -1; 473 } 474 else if(o1.getFirst()>o2.getFirst()){ 475 return +1; 476 } 477 else{ 478 if(o1.getSecond()<o2.getSecond()){ 479 return -1; 480 } 481 else if(o1.getSecond()>o2.getSecond()){ 482 return 1; 483 } 484 else{ 485 return 0; 486 } 487 } 488 } 489 }); 490 491 492 493 for(Pair<Integer> p: outList){ 494 int i = p.getFirst(); 495 int j = p.getSecond(); 496 BridgeType btype = null; 497 // Now do the bonding 498 if ((isBonded(i-1,j) && isBonded(j,i+1)) || 499 (isBonded(j-1,i) && isBonded(i,j+1))) { 500 btype = BridgeType.parallel; 501 } 502 else if ((isBonded(i,j) && isBonded(j,i)) || 503 (isBonded(i-1,j+1) && (isBonded(j-1,i+1)))) { 504 btype = BridgeType.antiparallel; 505 } 506 if (btype != null){ 507 registerBridge(i, j, btype); 508 } 509 } 510 511 512 } 513 514 private void detectBends() { 515 516 for (int i = 2 ; i < groups.length-2 ;i++){ 517 518 //Check if all atoms form peptide bonds (backbone discontinuity) 519 boolean bonded = true; 520 for (int k=0; k<4; k++){ 521 int index = i+k-2; 522 Atom C = groups[index].getC(); 523 Atom N = groups[index+1].getN(); 524 //Peptide bond C-N 525 if (Calc.getDistance(C, N) > MAX_PEPTIDE_BOND_LENGTH){ 526 bonded = false; 527 break; 528 } 529 } 530 if (!bonded) continue; 531 532 SecStrucGroup im2 = groups[i-2]; 533 SecStrucGroup g = groups[i]; 534 SecStrucGroup ip2 = groups[i+2]; 535 536 Atom caim2 = im2.getCA(); 537 Atom cag = g.getCA(); 538 Atom caip2 = ip2.getCA(); 539 540 //Create vectors ( Ca i to Ca i-2 ) ; ( Ca i to CA i + 2 ) 541 Atom caminus2 = Calc.subtract(caim2,cag); 542 Atom caplus2 = Calc.subtract(cag,caip2); 543 544 double angle = Calc.angle(caminus2, caplus2); 545 546 SecStrucState state = getSecStrucState(i); 547 state.setKappa((float) angle); 548 549 //Angles = 360 should be discarded 550 if (angle > 70.0 && angle < 359.99) { 551 setSecStrucType(i, SecStrucType.bend); 552 state.setBend(true); 553 } 554 } 555 } 556 557 private void calculateDihedralAngles() { 558 559 // dihedral angles 560 // phi: C-N-CA-C 561 // psi: N-CA-C-N 562 // Chi1: N-CA-CB-CG, N-CA-CB-OG(SER),N-CA-CB-OG1(Thr), 563 // N-CA-CB-CG1(ILE/VAL), N-CA-CB-SG(CYS) 564 // Omega: CA-C-N-CA 565 566 for (int i=0 ; i < groups.length-1 ; i++){ 567 568 SecStrucGroup a = groups[i]; 569 SecStrucGroup b = groups[i+1]; 570 571 Atom a_N = a.getN(); 572 Atom a_CA = a.getCA(); 573 Atom a_C = a.getC(); 574 575 Atom b_N = b.getN(); 576 Atom b_CA = b.getCA(); 577 Atom b_C = b.getC(); 578 579 double phi = Calc.torsionAngle(a_C,b_N,b_CA,b_C); 580 double psi = Calc.torsionAngle(a_N,a_CA,a_C,b_N); 581 double omega = Calc.torsionAngle(a_CA,a_C,b_N,b_CA); 582 583 SecStrucState state1 = (SecStrucState) 584 a.getProperty(Group.SEC_STRUC); 585 SecStrucState state2 = (SecStrucState) 586 b.getProperty(Group.SEC_STRUC); 587 588 state2.setPhi(phi); 589 state1.setPsi(psi); 590 state1.setOmega(omega); 591 } 592 } 593 594 @Override 595 public String toString() { 596 return printDSSP(); 597 } 598 599 /** 600 * Generate a DSSP file format ouput String of this SS prediction. 601 * @return String in DSSP output file format 602 */ 603 public String printDSSP() { 604 605 StringBuffer buf = new StringBuffer(); 606 String nl = System.getProperty("line.separator"); 607 608 //Header Line 609 buf.append("==== Secondary Structure Definition by BioJava" 610 + " DSSP implementation, Version October 2015 ===="+nl); 611 612 //First line with column definition 613 buf.append(" # RESIDUE AA STRUCTURE BP1 BP2 ACC " 614 + "N-H-->O O-->H-N N-H-->O O-->H-N " 615 + "TCO KAPPA ALPHA PHI PSI " 616 + "X-CA Y-CA Z-CA "); 617 618 for (int i =0 ; i < groups.length ;i++){ 619 buf.append(nl); 620 SecStrucState ss = getSecStrucState(i); 621 buf.append(ss.printDSSPline(i)); 622 } 623 624 return buf.toString(); 625 } 626 627 /** 628 * Generate a summary of this SS prediction with information about 629 * the three types of helix turns in different row sequences. 630 * <p> 631 * This is similar to the summary output of Jmol, and useful to visualize 632 * the helix patterns. 633 * 634 * @return String helix summary 635 */ 636 public String printHelixSummary() { 637 638 StringBuffer g = new StringBuffer(); //3-10 helix 639 StringBuffer h = new StringBuffer(); //alpha helix 640 StringBuffer i = new StringBuffer(); //pi-helix 641 StringBuffer ss = new StringBuffer(); //SS summary 642 StringBuffer aa = new StringBuffer(); //AA one-letter 643 String nl = System.getProperty("line.separator"); 644 645 g.append( "3 turn: "); 646 h.append( "4 turn: "); 647 i.append( "5 turn: "); 648 ss.append( "SS: "); 649 aa.append( "AA: "); 650 651 for (int k = 0; k < groups.length; k++){ 652 653 SecStrucState state = getSecStrucState(k); 654 g.append(state.getTurn()[0]); 655 h.append(state.getTurn()[1]); 656 i.append(state.getTurn()[2]); 657 ss.append(state.getType()); 658 aa.append(StructureTools.get1LetterCode(groups[k].getPDBName())); 659 } 660 661 return g.toString()+nl+h.toString()+nl+ 662 i.toString()+nl+ss.toString()+nl+aa.toString(); 663 } 664 665 /** 666 * Generate a FASTA sequence with the SS annotation letters in the 667 * aminoacid sequence order. 668 * @return String in FASTA sequence format 669 */ 670 public String printFASTA() { 671 672 StringBuffer buf = new StringBuffer(); 673 String nl = System.getProperty("line.separator"); 674 buf.append(">"+groups[0].getChain().getStructure().getIdentifier()+nl); 675 676 for (int g = 0; g < groups.length; g++){ 677 buf.append(getSecStrucState(g).getType()); 678 } 679 return buf.toString(); 680 } 681 682 @Override 683 public int hashCode() { 684 final int prime = 31; 685 int result = 1; 686 result = prime * result + Arrays.hashCode(atoms); 687 return result; 688 } 689 690 @Override 691 public boolean equals(Object o){ 692 693 if (!(o instanceof SecStrucCalc)) return false; 694 else { 695 SecStrucCalc ss = (SecStrucCalc) o; 696 if (groups.length != ss.groups.length) return false; 697 698 for (int g=0; g<groups.length; g++){ 699 SecStrucInfo g1 = getSecStrucState(g); 700 SecStrucInfo g2 = ss.getSecStrucState(g); 701 if (!g1.equals(g2)) return false; 702 } 703 return true; 704 } 705 } 706 707 private static SecStrucGroup[] initGroupArray(Structure s, int modelId) { 708 List<SecStrucGroup> groupList = new ArrayList<>(); 709 // 710 for ( Chain c : s.getChains(modelId)){ 711 712 for (Group g : c.getAtomGroups()){ 713 714 //We can also calc secstruc if it is a modified amino acid 715 if ( g.hasAminoAtoms()) { 716 717 SecStrucGroup sg = new SecStrucGroup(); 718 sg.setResidueNumber(g.getResidueNumber()); 719 sg.setPDBFlag(true); 720 sg.setPDBName(g.getPDBName()); 721 sg.setChain(g.getChain()); 722 723 Atom N = g.getAtom(StructureTools.N_ATOM_NAME); 724 Atom CA = g.getAtom(StructureTools.CA_ATOM_NAME); 725 Atom C = g.getAtom(StructureTools.C_ATOM_NAME); 726 Atom O = g.getAtom(StructureTools.O_ATOM_NAME); 727 if ( N == null || CA == null || C == null || O == null) 728 continue; 729 730 sg.setN((Atom) N.clone()); 731 sg.setCA((Atom) CA.clone()); 732 sg.setC((Atom) C.clone()); 733 sg.setO((Atom) O.clone()); 734 sg.setOriginal(g); 735 736 SecStrucState state = new SecStrucState(sg, 737 SecStrucInfo.BIOJAVA_ASSIGNMENT, 738 SecStrucType.coil); 739 740 sg.setProperty(Group.SEC_STRUC, state); 741 groupList.add(sg); 742 } 743 } 744 745 } 746 return groupList.toArray(new SecStrucGroup[groupList.size()]); 747 } 748 749 /** 750 * Calculate the coordinates of the H atoms. They are usually 751 * missing in the PDB files as only few experimental methods allow 752 * to resolve their location. 753 */ 754 private void calculateHAtoms() throws StructureException { 755 756 for ( int i = 0 ; i < groups.length-1 ; i++) { 757 758 SecStrucGroup a = groups[i]; 759 SecStrucGroup b = groups[i+1]; 760 761 if ( !b.hasAtom("H") ) { 762 //Atom H = calc_H(a.getC(), b.getN(), b.getCA()); 763 Atom H = calcSimple_H(a.getC(), a.getO(), b.getN()); 764 b.setH(H); 765 } 766 } 767 } 768 769 770 771 /** 772 * Calculate the HBonds between different groups. 773 * see Creighton page 147 f 774 * Modified to use only the contact map 775 */ 776 private void calculateHBonds() { 777 /** 778 * More efficient method for calculating C-Alpha pairs 779 */ 780 if (groups.length < 5) return; 781 Iterator<AtomContact> otu = contactSet.iterator(); 782 while(otu.hasNext()){ 783 AtomContact ac = otu.next(); 784 Pair<Atom> pair = ac.getPair(); 785 Group g1 = pair.getFirst().getGroup(); 786 Group g2 = pair.getSecond().getGroup(); 787 // Now I need to get the index of the Group in the list groups 788 int i = indResMap.get(g1.getResidueNumber()); 789 int j = indResMap.get(g2.getResidueNumber()); 790 // Now check this 791 checkAddHBond(i,j); 792 //"backwards" hbonds are not allowed 793 if (j!=(i+1)) checkAddHBond(j,i); 794 } 795 } 796 797 private void checkAddHBond(int i, int j){ 798 799 SecStrucGroup one = groups[i]; 800 801 if ("PRO".equals(one.getPDBName())){ 802 logger.debug("Ignore: PRO {}", one.getResidueNumber()); 803 return; 804 } 805 if (!one.hasAtom("H")) { 806 logger.debug("Residue {} has no H",one.getResidueNumber()); 807 return; 808 } 809 810 SecStrucGroup two = groups[j]; 811 812 double energy = 0; 813 814 try { 815 energy = calculateHBondEnergy(one,two); 816 } catch (Exception e){ 817 logger.warn("Energy calculation failed", e); 818 return; 819 } 820 logger.debug("Energy between positions ({},{}): ",i,j,energy); 821 822 trackHBondEnergy(i,j,energy); 823 } 824 825 /** 826 * Calculate HBond energy of two groups in cal/mol 827 * see Creighton page 147 f 828 * <p> 829 * Jeffrey, George A., An introduction to hydrogen bonding, 830 * Oxford University Press, 1997. 831 * categorizes hbonds with donor-acceptor distances of 832 * 2.2-2.5 å as "strong, mostly covalent", 833 * 2.5-3.2 å as "moderate, mostly electrostatic", 834 * 3.2-4.0 å as "weak, electrostatic". 835 * Energies are given as 40-14, 15-4, and <4 kcal/mol respectively. 836 */ 837 private static double calculateHBondEnergy(SecStrucGroup one, 838 SecStrucGroup two) { 839 840 Atom N = one.getN(); 841 Atom H = one.getH(); 842 843 Atom O = two.getO(); 844 Atom C = two.getC(); 845 846 double dno = Calc.getDistance(O,N); 847 double dhc = Calc.getDistance(C,H); 848 double dho = Calc.getDistance(O,H); 849 double dnc = Calc.getDistance(C,N); 850 851 logger.debug(" cccc: {} {} {} {} O ({})..N ({}):{} | ho:{} - hc:{} + nc:{} - no:{}", 852 one.getResidueNumber(),one.getPDBName(),two.getResidueNumber(),two.getPDBName(), 853 O.getPDBserial(),N.getPDBserial(),dno,dho,dhc,dnc,dno); 854 855 //there seems to be a contact! 856 if ( (dno < MINDIST) || (dhc < MINDIST) || 857 (dnc < MINDIST) || (dno < MINDIST)) { 858 return HBONDLOWENERGY; 859 } 860 861 double e1 = Q / dho - Q / dhc; 862 double e2 = Q / dnc - Q / dno; 863 864 double energy = e1 + e2; 865 866 logger.debug(" N ({}) O({}): {} : {} ",N.getPDBserial(),O.getPDBserial(),(float) dno,energy); 867 868 //Avoid too strong energy 869 if (energy > HBONDLOWENERGY) return energy; 870 871 return HBONDLOWENERGY ; 872 } 873 874 /** 875 * Store Hbonds in the Groups. 876 * DSSP allows two HBonds per aminoacids to allow bifurcated bonds. 877 */ 878 private void trackHBondEnergy(int i, int j, double energy) { 879 880 if ("PRO".equals(groups[i].getPDBName())) { 881 logger.debug("Ignore: PRO {}",groups[i].getResidueNumber()); 882 return; 883 } 884 885 SecStrucState stateOne = getSecStrucState(i); 886 SecStrucState stateTwo = getSecStrucState(j); 887 888 double acc1e = stateOne.getAccept1().getEnergy(); 889 double acc2e = stateOne.getAccept2().getEnergy(); 890 891 double don1e = stateTwo.getDonor1().getEnergy(); 892 double don2e = stateTwo.getDonor2().getEnergy(); 893 894 //Acceptor: N-H-->O 895 if (energy < acc1e) { 896 logger.debug("{} < {}",energy,acc1e); 897 stateOne.setAccept2(stateOne.getAccept1()); 898 899 HBond bond = new HBond(); 900 bond.setEnergy(energy); 901 bond.setPartner(j); 902 903 stateOne.setAccept1(bond); 904 905 } else if ( energy < acc2e ) { 906 logger.debug("{} < {}",energy,acc2e); 907 908 HBond bond = new HBond(); 909 bond.setEnergy(energy); 910 bond.setPartner(j); 911 912 stateOne.setAccept2(bond); 913 } 914 915 916 //The other side of the bond: donor O-->N-H 917 if (energy < don1e) { 918 logger.debug("{} < {}",energy,don1e); 919 stateTwo.setDonor2(stateTwo.getDonor1()); 920 921 HBond bond = new HBond(); 922 bond.setEnergy(energy); 923 bond.setPartner(i); 924 925 stateTwo.setDonor1(bond); 926 927 } else if ( energy < don2e ) { 928 logger.debug("{} < {}",energy,don2e); 929 930 HBond bond = new HBond(); 931 bond.setEnergy(energy); 932 bond.setPartner(i); 933 934 stateTwo.setDonor2(bond); 935 } 936 } 937 938 /** 939 * Detect helical turn patterns. 940 */ 941 private void calculateTurns(){ 942 943 for (int i = 0 ; i< groups.length; i++){ 944 for (int turn = 3; turn <= 5; turn++) { 945 946 if (i+turn >= groups.length) continue; 947 948 //Check for H bond from NH(i+n) to CO(i) 949 if (isBonded(i, i+turn)) { 950 logger.debug("Turn at ({},{}) turn {}",i,(i+turn),turn); 951 getSecStrucState(i).setTurn('>', turn); 952 getSecStrucState(i+turn).setTurn('<', turn); 953 //Bracketed residues get the helix number 954 for (int j=i+1; j<i+turn; j++){ 955 Integer t = turn; 956 char helix = t.toString().charAt(0); 957 getSecStrucState(j).setTurn(helix, turn); 958 } 959 } 960 } 961 } 962 } 963 964 /** 965 * Test if two groups are forming an H-Bond. The bond tested is 966 * from the CO of group i to the NH of group j. Acceptor (i) and 967 * donor (j). The donor of i has to be j, and the acceptor of j 968 * has to be i. 969 * DSSP defines H-Bonds if the energy < -500 cal/mol. 970 * 971 * @param i group one 972 * @param j group two 973 * @return flag if the two are forming an Hbond 974 */ 975 private boolean isBonded(int i, int j) { 976 977 SecStrucState one = getSecStrucState(i); 978 SecStrucState two = getSecStrucState(j); 979 980 double don1e = one.getDonor1().getEnergy(); 981 double don2e = one.getDonor2().getEnergy(); 982 double acc1e = two.getAccept1().getEnergy(); 983 double acc2e = two.getAccept2().getEnergy(); 984 985 int don1p = one.getDonor1().getPartner(); 986 int don2p = one.getDonor2().getPartner(); 987 int acc1p = two.getAccept1().getPartner(); 988 int acc2p = two.getAccept2().getPartner(); 989 990 //Either donor from i is j, or accept from j is i 991 boolean hbond = (don1p == j && don1e < HBONDHIGHENERGY) || 992 (don2p == j && don2e < HBONDHIGHENERGY) || 993 (acc1p == i && acc1e < HBONDHIGHENERGY) || 994 (acc2p == i && acc2e < HBONDHIGHENERGY); 995 996 if (hbond){ 997 logger.debug("*** H-bond from CO of {} to NH of {}", i, j); 998 return true; 999 } 1000 return false ; 1001 } 1002 1003 /** 1004 * Use unit vectors NC and NCalpha Add them. Calc unit vector and 1005 * substract it from N. 1006 * C coordinates are from amino acid i-1 1007 * N, CA atoms from amino acid i 1008 * 1009 * @link http://openbioinformatics.blogspot.com/ 1010 * 2009/08/how-to-calculate-h-atoms-for-nitrogens.html 1011 */ 1012 @SuppressWarnings("unused") 1013 private static Atom calc_H(Atom C, Atom N, Atom CA) 1014 throws StructureException { 1015 1016 Atom nc = Calc.subtract(N,C); 1017 Atom nca = Calc.subtract(N,CA); 1018 1019 Atom u_nc = Calc.unitVector(nc) ; 1020 Atom u_nca = Calc.unitVector(nca); 1021 1022 Atom added = Calc.add(u_nc,u_nca); 1023 1024 Atom U = Calc.unitVector(added); 1025 1026 // according to Creighton distance N-H is 1.03 +/- 0.02A 1027 Atom H = Calc.add(N,U); 1028 1029 H.setName("H"); 1030 // this atom does not have a pdbserial number ... 1031 return H; 1032 1033 } 1034 1035 private static Atom calcSimple_H(Atom c, Atom o, Atom n) { 1036 1037 Atom h = Calc.subtract(c,o); 1038 double dist = Calc.getDistance(o,c); 1039 //System.out.println(dist); 1040 double x = n.getX() + h.getX() / dist; 1041 double y = n.getY() + h.getY() / dist; 1042 double z = n.getZ() + h.getZ() / dist; 1043 1044 h.setX(x); 1045 h.setY(y); 1046 h.setZ(z); 1047 1048 h.setName("H"); 1049 return h; 1050 } 1051 1052 private void buildHelices(){ 1053 1054 //Alpha-helix (i+4), 3-10-helix (i+3), Pi-helix (i+5) 1055 checkSetHelix(4, SecStrucType.helix4); 1056 checkSetHelix(3, SecStrucType.helix3); 1057 checkSetHelix(5, SecStrucType.helix5); 1058 1059 checkSetTurns(); 1060 } 1061 1062 private void checkSetTurns() { 1063 1064 SecStrucType type = SecStrucType.turn; 1065 1066 for (int idx = 0; idx < 3; idx++) { 1067 for (int i = 0; i < groups.length-1; i++) { 1068 1069 SecStrucState state = getSecStrucState(i); 1070 char[] turn = state.getTurn(); 1071 1072 //Any turn opening matters 1073 if (turn[idx] == '>' || turn[idx] == 'X') { 1074 //Mark following n residues as turn 1075 for (int k=1; k<idx+3; k++){ 1076 setSecStrucType(i+k, type); 1077 } 1078 if (!DSSP_HELICES) { 1079 setSecStrucType(i, type); 1080 setSecStrucType(i+idx+3, type); 1081 } 1082 } 1083 } 1084 } 1085 } 1086 1087 /** 1088 * A minimal helix is defined by two consecutive n-turns. 1089 * For example, a 4-helix, of minimal length 4 from residues 1090 * i to (i+3), requires turns (of type 4) at residues (i-1) and i. 1091 * <p> 1092 * Note that the orignal DSSP implementation does not assign 1093 * helix type to residue (i-1) and residue (i+n+1), although 1094 * they contain a helix turn. As they state in the original paper, 1095 * "the helices are one residue shorter than they would be according 1096 * to rule 6.3 of IUPAC-IUB". 1097 * 1098 * @param n 1099 * @param type 1100 */ 1101 private void checkSetHelix(int n, SecStrucType type){ 1102 1103 int idx = n - 3; 1104 logger.debug("Set helix {} {} {}", type, n, idx); 1105 1106 for (int i = 1; i < groups.length-n; i++) { 1107 1108 SecStrucState state = getSecStrucState(i); 1109 SecStrucState previousState = getSecStrucState(i-1); 1110 1111 //Check that no other helix was assgined to this range 1112 if (state.getType().compareTo(type) < 0) continue; 1113 if (getSecStrucState(i+1).getType().compareTo(type) < 0) continue; 1114 1115 char turn = state.getTurn()[idx]; 1116 char pturn = previousState.getTurn()[idx]; 1117 1118 //Two consecutive n-turns present to define a n-helix 1119 if ((turn=='>' || turn=='X') && (pturn=='>' || pturn=='X')) { 1120 //Mark following n residues as turn 1121 for (int k=0; k<n; k++){ 1122 setSecStrucType(i+k, type); 1123 } 1124 if (!DSSP_HELICES) { 1125 setSecStrucType(i-1, type); 1126 setSecStrucType(i+n, type); 1127 } 1128 } 1129 } 1130 } 1131 1132 /** 1133 * Set the new type only if it has more preference than the 1134 * current residue SS type. 1135 * @param pos 1136 * @param type 1137 */ 1138 private void setSecStrucType(int pos, SecStrucType type){ 1139 SecStrucState ss = getSecStrucState(pos); 1140 if (type.compareTo(ss.getType()) < 0) ss.setType(type); 1141 } 1142 1143 private SecStrucState getSecStrucState(int pos){ 1144 Group g = groups[pos]; 1145 SecStrucState state = (SecStrucState) g.getProperty(Group.SEC_STRUC); 1146 return state; 1147 } 1148 1149}