001/*
002 *                    BioJava development code
003 *
004 * This code may be freely distributed and modified under the
005 * terms of the GNU Lesser General Public Licence.  This should
006 * be distributed with the code.  If you do not have a copy,
007 * see:
008 *
009 *      http://www.gnu.org/copyleft/lesser.html
010 *
011 * Copyright for this code is held jointly by the individual
012 * authors.  These should be listed in @author doc comments.
013 *
014 * For more information on the BioJava project and its aims,
015 * or to join the biojava-l mailing list, visit the home page
016 * at:
017 *
018 *      http://www.biojava.org/
019 *
020 * Created on June 24, 2010
021 * Author: Mark Chapman
022 */
023
024package org.biojava.nbio.alignment.template;
025
026import org.biojava.nbio.core.alignment.template.ProfilePair;
027import org.biojava.nbio.core.alignment.template.Profile;
028import org.biojava.nbio.core.alignment.template.SubstitutionMatrix;
029import org.biojava.nbio.alignment.template.GapPenalty.Type;
030import org.biojava.nbio.core.sequence.template.Compound;
031import org.biojava.nbio.core.sequence.template.CompoundSet;
032import org.biojava.nbio.core.sequence.template.Sequence;
033import org.slf4j.Logger;
034import org.slf4j.LoggerFactory;
035
036import java.util.ArrayList;
037import java.util.List;
038import java.util.concurrent.ExecutionException;
039import java.util.concurrent.Future;
040
041/**
042 * Implements common code for an {@link Aligner} for a pair of {@link Profile}s.
043 *
044 * @author Mark Chapman
045 * @param <S> each {@link Sequence} in the pair of alignment {@link Profile}s is of type S
046 * @param <C> each element of a sequence is a {@link Compound} of type C
047 */
048public abstract class AbstractProfileProfileAligner<S extends Sequence<C>, C extends Compound>
049                extends AbstractMatrixAligner<S, C> implements ProfileProfileAligner<S, C> {
050
051        private final static Logger logger = LoggerFactory.getLogger(AbstractProfileProfileAligner.class);
052
053        // additional input fields
054        private Profile<S, C> query, target;
055
056        // concurrent execution fields
057        private Future<ProfilePair<S, C>> queryFuture, targetFuture;
058
059        // cached fields
060        private List<C> cslist;
061        private float[][] qfrac, tfrac;
062
063        // additional output field
064        protected ProfilePair<S, C> pair;
065
066        /**
067         * Before running a profile-profile alignment, data must be sent in via calls to
068         * {@link #setQuery(Profile)}, {@link #setTarget(Profile)}, {@link #setGapPenalty(GapPenalty)}, and
069         * {@link #setSubstitutionMatrix(SubstitutionMatrix)}.
070         */
071        protected AbstractProfileProfileAligner() {
072        }
073
074        /**
075         * Prepares for a profile-profile alignment.
076         *
077         * @param query the first {@link Profile} of the pair to align
078         * @param target the second {@link Profile} of the pair to align
079         * @param gapPenalty the gap penalties used during alignment
080         * @param subMatrix the set of substitution scores used during alignment
081         */
082        protected AbstractProfileProfileAligner(Profile<S, C> query, Profile<S, C> target, GapPenalty gapPenalty,
083                        SubstitutionMatrix<C> subMatrix) {
084                super(gapPenalty, subMatrix);
085                this.query = query;
086                this.target = target;
087                reset();
088        }
089
090        /**
091         * Prepares for a profile-profile alignment run concurrently.
092         *
093         * @param query the first {@link Profile} of the pair to align, still to be calculated
094         * @param target the second {@link Profile} of the pair to align, still to be calculated
095         * @param gapPenalty the gap penalties used during alignment
096         * @param subMatrix the set of substitution scores used during alignment
097         */
098        protected AbstractProfileProfileAligner(Future<ProfilePair<S, C>> query, Future<ProfilePair<S, C>> target,
099                        GapPenalty gapPenalty, SubstitutionMatrix<C> subMatrix) {
100                super(gapPenalty, subMatrix);
101                queryFuture = query;
102                targetFuture = target;
103                reset();
104        }
105
106        /**
107         * Prepares for a profile-profile alignment run concurrently.
108         *
109         * @param query the first {@link Profile} of the pair to align
110         * @param target the second {@link Profile} of the pair to align, still to be calculated
111         * @param gapPenalty the gap penalties used during alignment
112         * @param subMatrix the set of substitution scores used during alignment
113         */
114        protected AbstractProfileProfileAligner(Profile<S, C> query, Future<ProfilePair<S, C>> target,
115                        GapPenalty gapPenalty, SubstitutionMatrix<C> subMatrix) {
116                super(gapPenalty, subMatrix);
117                this.query = query;
118                targetFuture = target;
119                reset();
120        }
121
122        /**
123         * Prepares for a profile-profile alignment run concurrently.
124         *
125         * @param query the first {@link Profile} of the pair to align, still to be calculated
126         * @param target the second {@link Profile} of the pair to align
127         * @param gapPenalty the gap penalties used during alignment
128         * @param subMatrix the set of substitution scores used during alignment
129         */
130        protected AbstractProfileProfileAligner(Future<ProfilePair<S, C>> query, Profile<S, C> target,
131                        GapPenalty gapPenalty, SubstitutionMatrix<C> subMatrix) {
132                super(gapPenalty, subMatrix);
133                queryFuture = query;
134                this.target = target;
135                reset();
136        }
137
138        /**
139         * Sets the query {@link Profile}.
140         *
141         * @param query the first {@link Profile} of the pair to align
142         */
143        public void setQuery(Profile<S, C> query) {
144                this.query = query;
145                queryFuture = null;
146                reset();
147        }
148
149        /**
150         * Sets the target {@link Profile}.
151         *
152         * @param target the second {@link Profile} of the pair to align
153         */
154        public void setTarget(Profile<S, C> target) {
155                this.target = target;
156                targetFuture = null;
157                reset();
158        }
159
160        // method for ProfileProfileAligner
161
162        @Override
163        public ProfilePair<S, C> getPair() {
164                if (pair == null) {
165                        align();
166                }
167                return pair;
168        }
169
170        // methods for ProfileProfileScorer
171
172        @Override
173        public Profile<S, C> getQuery() {
174                return query;
175        }
176
177        @Override
178        public Profile<S, C> getTarget() {
179                return target;
180        }
181
182        // methods for AbstractMatrixAligner
183
184        @Override
185        protected CompoundSet<C> getCompoundSet() {
186                return (query == null) ? null : query.getCompoundSet();
187        }
188
189        @Override
190        protected List<C> getCompoundsOfQuery() {
191                // TODO replace with consensus sequence
192                return (query == null) ? new ArrayList<C>() : query.getAlignedSequence(1).getAsList();
193        }
194
195        @Override
196        protected List<C> getCompoundsOfTarget() {
197                // TODO replace with consensus sequence
198                return (target == null) ? new ArrayList<C>() : target.getAlignedSequence(1).getAsList();
199        }
200
201        @Override
202        protected int[] getScoreMatrixDimensions() {
203                return new int[] { query.getLength() + 1, target.getLength() + 1, (getGapPenalty().getType() == Type.LINEAR) ?
204                                1 : 3 };
205        }
206
207        @Override
208        protected int getSubstitutionScore(int queryColumn, int targetColumn) {
209                return getSubstitutionScore(qfrac[queryColumn - 1], tfrac[targetColumn - 1]);
210        }
211
212        @Override
213        protected boolean isReady() {
214                // TODO when added to ConcurrencyTools, log completions and exceptions instead of printing stack traces
215                try {
216                        if (query == null && queryFuture != null) {
217                                query = queryFuture.get();
218                        }
219                        if (target == null && targetFuture != null) {
220                                target = targetFuture.get();
221                        }
222                        reset();
223                } catch (InterruptedException e) {
224                        logger.error("Interrupted Exception: ", e);
225                } catch (ExecutionException e) {
226                        logger.error("Execution Exception: ", e);
227                }
228                return query != null && target != null && getGapPenalty() != null && getSubstitutionMatrix() != null &&
229                                query.getCompoundSet().equals(target.getCompoundSet());
230        }
231
232        @Override
233        protected void reset() {
234                super.reset();
235                pair = null;
236                if (query != null && target != null && getGapPenalty() != null && getSubstitutionMatrix() != null &&
237                                query.getCompoundSet().equals(target.getCompoundSet())) {
238                        int maxq = 0, maxt = 0;
239                        cslist = query.getCompoundSet().getAllCompounds();
240                        qfrac = new float[query.getLength()][];
241                        for (int i = 0; i < qfrac.length; i++) {
242                                qfrac[i] = query.getCompoundWeightsAt(i + 1, cslist);
243                                maxq += getSubstitutionScore(qfrac[i], qfrac[i]);
244                        }
245                        tfrac = new float[target.getLength()][];
246                        for (int i = 0; i < tfrac.length; i++) {
247                                tfrac[i] = target.getCompoundWeightsAt(i + 1, cslist);
248                                maxt += getSubstitutionScore(tfrac[i], tfrac[i]);
249                        }
250                        max = Math.max(maxq, maxt);
251                        score = min = isLocal() ? 0 : (int) (2 * getGapPenalty().getOpenPenalty() + (query.getLength() +
252                                        target.getLength()) * getGapPenalty().getExtensionPenalty());
253                }
254        }
255
256        // helper method that scores alignment of two column vectors
257        private int getSubstitutionScore(float[] qv, float[] tv) {
258                float score = 0.0f;
259                for (int q = 0; q < qv.length; q++) {
260                        if (qv[q] > 0.0f) {
261                                for (int t = 0; t < tv.length; t++) {
262                                        if (tv[t] > 0.0f) {
263                                                score += qv[q]*tv[t]*getSubstitutionMatrix().getValue(cslist.get(q), cslist.get(t));
264                                        }
265                                }
266                        }
267                }
268                return Math.round(score);
269        }
270
271}