001/*
002 *                    BioJava development code
003 *
004 * This code may be freely distributed and modified under the
005 * terms of the GNU Lesser General Public Licence.  This should
006 * be distributed with the code.  If you do not have a copy,
007 * see:
008 *
009 *      http://www.gnu.org/copyleft/lesser.html
010 *
011 * Copyright for this code is held jointly by the individual
012 * authors.  These should be listed in @author doc comments.
013 *
014 * For more information on the BioJava project and its aims,
015 * or to join the biojava-l mailing list, visit the home page
016 * at:
017 *
018 *      http://www.biojava.org/
019 *
020 * Created on 05.03.2004
021 * @author Andreas Prlic
022 *
023 */
024package org.biojava.nbio.structure;
025
026import org.biojava.nbio.structure.chem.ChemComp;
027
028import java.io.Serializable;
029import java.util.Iterator;
030import java.util.List;
031import java.util.Map;
032
033/**
034 *
035 * This is the data structure for a single Group of atoms.  A protein
036 * sequence ({@link Chain} in PDB file) is represented as a list of Groups.
037 * There are 3 types of Groups:
038 *
039 * <ul>
040 * <li>{@link AminoAcid}</li>
041 * <li>{@link HetatomImpl Hetatom}</li>
042 * <li>{@link NucleotideImpl Nucleotide}</li>
043 * </ul>
044 *
045 *
046 * @see HetatomImpl
047 * @see AminoAcidImpl
048 * @see NucleotideImpl
049 * @author Andreas Prlic
050 * @author Horvath Tamas
051 * @since 1.4
052 * @version %I% %G%
053 *
054 */
055public interface Group extends Serializable {
056
057        /** Group property key for secondary structure annotation */
058        public static final String SEC_STRUC = "secstruc";
059
060        /**
061         * Get number of atoms.
062         * @return number of atoms of this Group
063         */
064        public int size();
065
066        /**
067         * Return true or false, depending if this group has 3D coordinates or not.
068         *
069         * @return true if Group has 3D coordinates
070         */
071        public boolean has3D ();
072
073        /**
074         * Flag if group has 3D data .
075         *
076         * @param flag  true to set flag that this Group has 3D coordinates
077         */
078        public void setPDBFlag(boolean flag);
079
080        /**
081         * Get Type of group, one of {@link GroupType#AMINOACID}, {@link GroupType#HETATM}
082         * or {@link GroupType#NUCLEOTIDE}
083         *
084         * @return a String representing the type value
085         */
086        public GroupType getType();
087
088        /**
089         * Add an atom to this group.
090         *
091         * @param atom  an Atom object
092         */
093        public void addAtom(Atom atom);
094
095        /**
096         * Get list of atoms.
097         *
098         * @return a List object representing the atoms
099         * @see #setAtoms(List)
100         */
101        public List<Atom> getAtoms() ;
102
103
104        /**
105         * Set the atoms of this group.
106         * @see Atom
107         * @param atoms a list of atoms
108         */
109        public void setAtoms(List<Atom> atoms);
110
111        /**
112         * Remove all atoms from this group.
113         *
114         */
115        public void clearAtoms();
116
117        /**
118         * Get an atom given its PDB name.
119         * Beware that some PDB atom names are ambiguous (e.g. CA, which means C-alpha or Calcium),
120         * ambiguities should not occur within the same group though. To solve these ambiguities
121         * one would need to check the atom returned for the required element with {@link Atom#getElement()}
122         * <p>
123         * Note this method will return only the atom in the default alternative location (be it '.' or a letter).
124         *
125         * @param name  a trimmed String representing the atom's PDB name, e.g. "CA"
126         * @return an Atom object or null if no such atom exists within this group
127         */
128        public Atom getAtom(String name) ;
129
130        /**
131         * Get at atom by position.
132         *
133         * @param position  an int
134         * @return an Atom object or null if no Atom exists for given position
135         */
136        public Atom getAtom(int position) ;
137
138        /**
139         * Tell whether a particular atom exists within this group.
140         * Beware that some PDB atom names are ambiguous (e.g. CA, which means C-alpha or Calcium),
141         * ambiguities should not occur within the same group though.
142         *
143         * @param name  a trimmed String representing the atom's PDB name, e.g. "CA"
144         * @return true if Atom with name exists within this group
145         */
146        public boolean hasAtom(String name);
147
148        /**
149         * Get the PDB 3-letter name for this group. (e.g. ALA)
150         *
151         * @return a String representing the PDBName value
152         * @see #setPDBName
153         */
154        public String getPDBName();
155
156        /**
157         * Set the PDB 3-letter name for this group. (e.g. ALA)
158         *
159         * @param s  a String specifying the PDBName value
160         * @see #getPDBName
161         */
162        public void setPDBName(String s) ;
163
164
165        /**
166         * Calculate if this group has all atoms required for an amino acid backbone.
167         * This allows to include chemically modified amino acids that
168         * are labeled hetatoms into some computations, the usual way
169         * to identify if a group is an amino acid is {@link #getType()}
170         * <p>
171         * amino atoms are : N, CA, C, O
172         * </p>
173         *
174         * Example: 1DW9 chain A first group is a Selenomethionine, provided as HETATM, but here returns true.
175         * <pre>
176         * HETATM    1  N   MSE A   1      11.720  20.973   1.584  0.00  0.00           N
177         * HETATM    2  CA  MSE A   1      10.381  20.548   1.139  0.00  0.00           C
178         * HETATM    3  C   MSE A   1       9.637  20.037   2.398  0.00  0.00           C
179         * HETATM    4  O   MSE A   1      10.198  19.156   2.985  0.00  0.00           O
180         * HETATM    5  CB  MSE A   1      10.407  19.441   0.088  0.00  0.00           C
181         * </pre>
182         *
183         * @return true if all Atoms required for an AminoAcid are available (N, CA, C, O)
184         * @see #getType
185         */
186        public boolean hasAminoAtoms() ;
187
188
189        /**
190         * Check if this group is a polymeric group, from the definition in Chemical Component Dictionary
191         *
192         * @return true if a polymeric group
193         */
194        public boolean isPolymeric();
195
196
197        /**
198         * Check if this group is an aminoacid group, from the definition in Chemical Component Dictionary
199         *
200         * @return true if an amino acid
201         */
202        public boolean isAminoAcid();
203
204
205        /**
206         * Check if this group is a nucleotide group, from the definition in Chemical Component Dictionary
207         *
208         * @return true if a nucleotide
209         */
210        public boolean isNucleotide();
211
212
213
214        /**
215         * Properties of this amino acid. Currently available properties are:
216         * phi
217         * psi
218         * secstruc
219         *
220         * @param properties  a Map object specifying the properties value
221         * @see #getProperties
222         */
223        public void setProperties(Map<String,Object> properties) ;
224
225        /**
226         * Return properties.
227         * @see #setProperties
228         *
229         * @return a HashMap object representing the properties value
230         */
231        public Map<String,Object> getProperties() ;
232
233        /**
234         * Set a single property .
235         *
236         * @param key    a String
237         * @param value  an Object
238         * @see #getProperty
239         */
240        public void setProperty(String key, Object value) ;
241
242        /**
243         * Get a single property .
244         *
245         * @param key  a String
246         * @return an Object
247         * @see #setProperty
248         */
249        public Object getProperty(String key) ;
250
251        /**
252         * Get an Atom Iterator.
253         *
254         * @return an Iterator object
255         */
256        public Iterator<Atom> iterator() ;
257
258
259        /**
260         * Returns and identical copy of this Group object .
261         * @return  and identical copy of this Group object
262         */
263        public Object clone();
264
265        /**
266         * Sets the back-reference to its parent Chain.
267         * @param chain the parent Chain
268         * @see #getChain()
269         * @since 3.0
270         */
271        public void setChain(Chain chain);
272
273        /**
274         * Returns the parent Chain of the Group.
275         *
276         * @return Chain the Chain object that contains the Group
277         * @see #setChain(Chain)
278         * @since 3.0
279         */
280        public Chain getChain() ;
281
282        /**
283         * Returns a dynamically created ResidueNumber for the group - this
284         * contains the chainId, resNum and insCode of the group.
285         * @see ResidueNumber
286         * @return ResidueNumber for the group.
287         * @since 3.0
288         */
289        public ResidueNumber getResidueNumber();
290
291
292        /**
293         * Sets the ResidueNumber for this Group
294         *
295         * @param residueNumber the PDB residueNumber
296         */
297        public void setResidueNumber(ResidueNumber residueNumber);
298
299        /**
300         * Utility method to temporarily set a chainID for a group, if a parent chain object does not exist yet.
301         * Not recommended for general use other than parsing.
302         *
303         * @param chainId
304         * @param residueNumber
305         * @param iCode
306         */
307        public void setResidueNumber(String chainId, Integer residueNumber, Character iCode);
308
309        /**
310         * Utility method for returning the chainId of the Group or null if no
311         * Chain has been set. This is equivalent to calling getChain().getId()
312         *
313         * Prior to version 5.0 this method returned the chain name.
314         * @since 3.0
315         * @return  the ID of the chain
316         */
317        public String getChainId();
318
319        /**
320         * Set the Chemical Component that closer describes this group.
321         *
322         * @param cc the chemical component
323         */
324        public void setChemComp(ChemComp cc);
325
326        /**
327         * Get the chemical component that closer describes this group. If the information does not exist yet, fetches the information from PDB web site.
328         *
329         * @return the Chemical Component definition for this Group.
330         */
331        public ChemComp getChemComp();
332
333
334        /**
335         * Check if this group has alternate location groups.
336         *
337         * @return boolean flag if there are alternate locations.
338         * @see #getAltLocs()
339         */
340        public boolean hasAltLoc();
341
342
343        /**
344         * Get the list of other alternate location groups.
345         * <p>
346         * The main group (this group) will contain the first altloc (be it the default '.' or 'A' or a mix of '.' and 'A').
347         * <p>
348         * This method will return the altloc groups that are not the main group, e.g.:
349         * <ul>
350         * <li> if '.' (default), 'A' and 'B' altlocs are present in file, the main group will contain
351         * the default '.' and this method will return 2 altloc groups
352         * </li>
353         *
354         * <li> if 'A' and 'B' are present in file without a default '.' group, then the main group will contain the 'A'
355         * location whilst this method will return only 1 altloc group with the 'B' location
356         * </li>
357         * </ul>
358         * <p>
359         * Note that atoms with the default altloc (.) are included in all groups. Atoms with other altlocs (typically A, B, etc)
360         * will be sorted into groups by altloc.
361         * <p>
362         * Thus it can happen that an altloc group duplicate the contents of the main group.
363         *
364         * @return List of other groups that are on alternate locations
365         */
366        public List<Group> getAltLocs();
367
368        /**
369         * Add a group that is an alternate location for this group.
370         *
371         * @param g the altloc group to add
372         */
373        public void addAltLoc(Group g);
374
375        /**
376         * Determines if this group is water.
377         *
378         * @see GroupType#WATERNAMES
379         * @return true if it's water, false otherwise.
380         */
381        public boolean isWater();
382
383        /**
384         * Gets the alternate location group to this group that has the alt-loc character code passed.
385         *
386         * @param altLoc the alternate location code of the group desired
387         * @return the alternate location group if found, or null otherwise
388         */
389        public Group getAltLocGroup(Character altLoc);
390
391
392        /**
393         * Attempts to reduce the memory imprint of this group by trimming
394         * all internal Collection objects to the required size.
395         *
396         */
397        public void trimToSize();
398
399        /**
400         * Function to get the Group as an MDL molblock
401         * @return the string of the MDL molblock
402         */
403        public String toSDF();
404
405        /**
406         * Tells whether the group is annotated as HETATM in the file.
407         * To be used only at parsing time to be able to infer that a
408         * polymeric group is in a ligand chain or not.
409         * @return
410         */
411        public boolean isHetAtomInFile();
412
413        /**
414         * Sets the field isHetAtomInFile which is intented only for
415         * helping in infering if a polymeric group is in a ligand chain
416         * or in a polymeric chain.
417         * @param isHetAtomInFile
418         */
419        public void setHetAtomInFile(boolean isHetAtomInFile);
420}