Line data Source code
1 : /* +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
2 : Copyright (c) 2014-2023 The plumed team
3 : (see the PEOPLE file at the root of the distribution for a list of names)
4 :
5 : See http://www.plumed.org for more information.
6 :
7 : This file is part of plumed, version 2.
8 :
9 : plumed is free software: you can redistribute it and/or modify
10 : it under the terms of the GNU Lesser General Public License as published by
11 : the Free Software Foundation, either version 3 of the License, or
12 : (at your option) any later version.
13 :
14 : plumed is distributed in the hope that it will be useful,
15 : but WITHOUT ANY WARRANTY; without even the implied warranty of
16 : MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 : GNU Lesser General Public License for more details.
18 :
19 : You should have received a copy of the GNU Lesser General Public License
20 : along with plumed. If not, see <http://www.gnu.org/licenses/>.
21 : +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ */
22 : #include "core/ActionAtomistic.h"
23 : #include "core/ActionPilot.h"
24 : #include "core/ActionRegister.h"
25 : #include "core/ActionWithValue.h"
26 : #include "tools/Vector.h"
27 : #include "tools/Matrix.h"
28 : #include "tools/AtomNumber.h"
29 : #include "tools/Tools.h"
30 : #include "tools/RMSD.h"
31 : #include "core/PlumedMain.h"
32 : #include "core/ActionSet.h"
33 : #include "core/GenericMolInfo.h"
34 : #include "core/PbcAction.h"
35 : #include "tools/PDB.h"
36 : #include "tools/Pbc.h"
37 :
38 : #include <vector>
39 : #include <string>
40 : #include <memory>
41 :
42 : namespace PLMD {
43 : namespace generic {
44 :
45 : //+PLUMEDOC GENERIC FIT_TO_TEMPLATE
46 : /*
47 : This action is used to align a molecule to a template.
48 :
49 : This can be used to move the coordinates stored in plumed
50 : so as to be aligned with a provided template in PDB format. Pdb should contain
51 : also weights for alignment (see the format of PDB files used e.g. for \ref RMSD).
52 : Make sure your PDB file is correctly formatted as explained \ref pdbreader "in this page".
53 : Weights for displacement are ignored, since no displacement is computed here.
54 : Notice that all atoms (not only those in the template) are aligned.
55 : To see what effect try
56 : the \ref DUMPATOMS directive to output the atomic positions.
57 :
58 : Also notice that PLUMED propagate forces correctly so that you can add a bias on a CV computed
59 : after alignment. For many CVs this has no effect, but in some case the alignment can
60 : change the result. Examples are:
61 : - \ref POSITION CV since it is affected by a rigid shift of the system.
62 : - \ref DISTANCE CV with COMPONENTS. Since the alignment could involve a rotation (with TYPE=OPTIMAL) the actual components could be different
63 : from the original ones.
64 : - \ref CELL components for a similar reason.
65 : - \ref DISTANCE from a \ref FIXEDATOM, provided the fixed atom is introduced _after_ the \ref FIT_TO_TEMPLATE action.
66 :
67 : \attention
68 : The implementation of TYPE=OPTIMAL is available but should be considered in testing phase. Please report any
69 : strange behavior.
70 :
71 : \attention
72 : This directive modifies the stored position at the precise moment
73 : it is executed. This means that only collective variables
74 : which are below it in the input script will see the corrected positions.
75 : As a general rule, put it at the top of the input file. Also, unless you
76 : know exactly what you are doing, leave the default stride (1), so that
77 : this action is performed at every MD step.
78 :
79 : When running with periodic boundary conditions, the atoms should be
80 : in the proper periodic image. This is done automatically since PLUMED 2.5,
81 : by considering the ordered list of atoms and rebuilding the molecules using a procedure
82 : that is equivalent to that done in \ref WHOLEMOLECULES . Notice that
83 : rebuilding is local to this action. This is different from \ref WHOLEMOLECULES
84 : which actually modifies the coordinates stored in PLUMED.
85 :
86 : In case you want to recover the old behavior you should use the NOPBC flag.
87 : In that case you need to take care that atoms are in the correct
88 : periodic image.
89 :
90 : \par Examples
91 :
92 : Align the atomic position to a template then print them.
93 : The following example is only translating the system so as
94 : to align the center of mass of a molecule to the one in the reference
95 : structure `ref.pdb`:
96 : \plumedfile
97 : # dump coordinates before fitting, to see the difference:
98 : DUMPATOMS FILE=dump-before.xyz ATOMS=1-20
99 :
100 : # fit coordinates to ref.pdb template
101 : # this is a "TYPE=SIMPLE" fit, so that only translations are used.
102 : FIT_TO_TEMPLATE STRIDE=1 REFERENCE=ref.pdb TYPE=SIMPLE
103 :
104 : # dump coordinates after fitting, to see the difference:
105 : DUMPATOMS FILE=dump-after.xyz ATOMS=1-20
106 : \endplumedfile
107 :
108 : The following example instead performs a rototranslational fit.
109 : \plumedfile
110 : # dump coordinates before fitting, to see the difference:
111 : DUMPATOMS FILE=dump-before.xyz ATOMS=1-20
112 :
113 : # fit coordinates to ref.pdb template
114 : # this is a "TYPE=OPTIMAL" fit, so that rototranslations are used.
115 : FIT_TO_TEMPLATE STRIDE=1 REFERENCE=ref.pdb TYPE=OPTIMAL
116 :
117 : # dump coordinates after fitting, to see the difference:
118 : DUMPATOMS FILE=dump-after.xyz ATOMS=1-20
119 : \endplumedfile
120 :
121 : In both these cases the reference structure should be provided in a reference pdb file such as the one below:
122 :
123 : \auxfile{ref.pdb}
124 : ATOM 8 HT3 ALA 2 -1.480 -1.560 1.212 1.00 1.00 DIA H
125 : ATOM 9 CAY ALA 2 -0.096 2.144 -0.669 1.00 1.00 DIA C
126 : ATOM 10 HY1 ALA 2 0.871 2.385 -0.588 1.00 1.00 DIA H
127 : ATOM 12 HY3 ALA 2 -0.520 2.679 -1.400 1.00 1.00 DIA H
128 : ATOM 14 OY ALA 2 -1.139 0.931 -0.973 1.00 1.00 DIA O
129 : END
130 : \endauxfile
131 :
132 : In the following example you see two completely equivalent way
133 : to restrain an atom close to a position that is defined in the reference
134 : frame of an aligned molecule. You could for instance use this command to calculate the
135 : position of the center of mass of a ligand after having aligned the atoms to the reference
136 : frame of the protein that is determined by aligning the atoms in the protein to the coordinates
137 : provided in the file ref.pdb
138 : \plumedfile
139 : # center of the ligand:
140 : center: CENTER ATOMS=100-110
141 :
142 : FIT_TO_TEMPLATE REFERENCE=ref.pdb TYPE=OPTIMAL
143 :
144 : # place a fixed atom in the protein reference coordinates:
145 : fix: FIXEDATOM AT=1.0,1.1,1.0
146 :
147 : # take the distance between the fixed atom and the center of the ligand
148 : d: DISTANCE ATOMS=center,fix
149 :
150 : # apply a restraint
151 : RESTRAINT ARG=d AT=0.0 KAPPA=100.0
152 : \endplumedfile
153 :
154 : Notice that you could have obtained an (almost) identical result by adding a fictitious
155 : atom to `ref.pdb` with the serial number corresponding to the atom labelled `center` (there is no automatic way
156 : to get it, but in this example it should be the number of atoms of the system plus one),
157 : and properly setting the weights for alignment and displacement in \ref RMSD.
158 : There are two differences to be expected:
159 : (ab) \ref FIT_TO_TEMPLATE might be slower since it has to rototranslate all the available atoms and
160 : (b) variables employing periodic boundary conditions (such as \ref DISTANCE without `NOPBC`, as in the example above)
161 : are allowed after \ref FIT_TO_TEMPLATE, whereas \ref RMSD expects the issues related to the periodic boundary conditions to be already solved.
162 : The latter means that before the \ref RMSD statement one should use \ref WRAPAROUND or \ref WHOLEMOLECULES to properly place
163 : the ligand.
164 :
165 :
166 : */
167 : //+ENDPLUMEDOC
168 :
169 :
170 : class FitToTemplate:
171 : public ActionPilot,
172 : public ActionAtomistic,
173 : public ActionWithValue {
174 : std::string type;
175 : bool nopbc;
176 : std::vector<double> weights;
177 : std::vector<std::pair<std::size_t,std::size_t> > p_aligned;
178 : Vector center;
179 : Vector shift;
180 : // optimal alignment related stuff
181 : std::unique_ptr<PLMD::RMSD> rmsd;
182 : Tensor rotation;
183 : Matrix< std::vector<Vector> > drotdpos;
184 : // not used anymore (see notes below at doNotRetrieve())
185 : // std::vector<Vector> positions;
186 : std::vector<Vector> DDistDRef;
187 : std::vector<Vector> ddistdpos;
188 : std::vector<Vector> centeredpositions;
189 : Vector center_positions;
190 : // Copy of the box value
191 : Value* boxValue;
192 : PbcAction* pbc_action;
193 : public:
194 : explicit FitToTemplate(const ActionOptions&ao);
195 : static void registerKeywords( Keywords& keys );
196 55 : bool actionHasForces() override {
197 55 : return true;
198 : }
199 : void calculate() override;
200 : void apply() override;
201 0 : unsigned getNumberOfDerivatives() override {
202 0 : plumed_merror("You should not call this function");
203 : };
204 : };
205 :
206 : PLUMED_REGISTER_ACTION(FitToTemplate,"FIT_TO_TEMPLATE")
207 :
208 13 : void FitToTemplate::registerKeywords( Keywords& keys ) {
209 13 : Action::registerKeywords( keys );
210 13 : ActionAtomistic::registerKeywords( keys );
211 26 : keys.add("compulsory","STRIDE","1","the frequency with which molecules are reassembled. Unless you are completely certain about what you are doing leave this set equal to 1!");
212 26 : keys.add("compulsory","REFERENCE","a file in pdb format containing the reference structure and the atoms involved in the CV.");
213 26 : keys.add("compulsory","TYPE","SIMPLE","the manner in which RMSD alignment is performed. Should be OPTIMAL or SIMPLE.");
214 26 : keys.addFlag("NOPBC",false,"ignore the periodic boundary conditions when calculating distances");
215 13 : }
216 :
217 9 : FitToTemplate::FitToTemplate(const ActionOptions&ao):
218 : Action(ao),
219 : ActionPilot(ao),
220 : ActionAtomistic(ao),
221 : ActionWithValue(ao),
222 18 : nopbc(false) {
223 : std::string reference;
224 9 : parse("REFERENCE",reference);
225 9 : type.assign("SIMPLE");
226 9 : parse("TYPE",type);
227 :
228 9 : parseFlag("NOPBC",nopbc);
229 : // if(type!="SIMPLE") error("Only TYPE=SIMPLE is implemented in FIT_TO_TEMPLATE");
230 :
231 9 : checkRead();
232 :
233 9 : PDB pdb;
234 :
235 : // read everything in ang and transform to nm if we are not in natural units
236 9 : if( !pdb.read(reference,usingNaturalUnits(),0.1/getUnits().getLength()) ) {
237 0 : error("missing input file " + reference );
238 : }
239 :
240 9 : requestAtoms(pdb.getAtomNumbers());
241 9 : log.printf(" found %zu atoms in input \n",pdb.getAtomNumbers().size());
242 9 : log.printf(" with indices : ");
243 42 : for(unsigned i=0; i<pdb.getAtomNumbers().size(); ++i) {
244 33 : if(i%25==0) {
245 9 : log<<"\n";
246 : }
247 33 : log.printf("%d ",pdb.getAtomNumbers()[i].serial());
248 : }
249 9 : log.printf("\n");
250 :
251 9 : std::vector<Vector> positions=pdb.getPositions();
252 9 : weights=pdb.getOccupancy();
253 9 : std::vector<AtomNumber> aligned=pdb.getAtomNumbers();
254 9 : p_aligned.resize( aligned.size() );
255 42 : for(unsigned i=0; i<aligned.size(); ++i) {
256 33 : p_aligned[i] = getValueIndices( aligned[i] );
257 : }
258 :
259 :
260 : // normalize weights
261 : double n=0.0;
262 42 : for(unsigned i=0; i<weights.size(); ++i) {
263 33 : n+=weights[i];
264 : }
265 9 : if(n==0.0) {
266 0 : error("PDB file " + reference + " has zero weights. Please check the occupancy column.");
267 : }
268 9 : n=1.0/n;
269 42 : for(unsigned i=0; i<weights.size(); ++i) {
270 33 : weights[i]*=n;
271 : }
272 :
273 : // normalize weights for rmsd calculation
274 9 : std::vector<double> weights_measure=pdb.getBeta();
275 : n=0.0;
276 42 : for(unsigned i=0; i<weights_measure.size(); ++i) {
277 33 : n+=weights_measure[i];
278 : }
279 9 : n=1.0/n;
280 42 : for(unsigned i=0; i<weights_measure.size(); ++i) {
281 33 : weights_measure[i]*=n;
282 : }
283 :
284 : // subtract the center
285 42 : for(unsigned i=0; i<weights.size(); ++i) {
286 33 : center+=positions[i]*weights[i];
287 : }
288 42 : for(unsigned i=0; i<weights.size(); ++i) {
289 33 : positions[i]-=center;
290 : }
291 :
292 13 : if(type=="OPTIMAL" or type=="OPTIMAL-FAST" ) {
293 5 : rmsd=Tools::make_unique<RMSD>();
294 5 : rmsd->set(weights,weights_measure,positions,type,false,false);// note: the reference is shifted now with center in the origin
295 10 : log<<" Method chosen for fitting: "<<rmsd->getMethod()<<" \n";
296 : }
297 9 : if(nopbc) {
298 1 : log<<" Ignoring PBCs when doing alignment, make sure your molecule is whole!<n";
299 : }
300 : // register the value of rmsd (might be useful sometimes)
301 9 : addValue();
302 9 : setNotPeriodic();
303 :
304 : // I remove this optimization now in order to use makeWhole()
305 : // Notice that for FIT_TO_TEMPLATE TYPE=OPTIMAL a copy was made anyway
306 : // (due to the need to store position to propagate forces on rotational matrix later)
307 : // For FIT_TO_TEMPLATE TYPE=SIMPLE in principle we could use it and write an ad hoc
308 : // version of makeWhole that only computes the center. Too lazy to do it now.
309 : // In case we do it later, remember that uncommenting this line means that
310 : // getPositions will not work anymore! GB
311 : // doNotRetrieve();
312 :
313 : // this is required so as to allow modifyGlobalForce() to return correct
314 : // also for forces that are not owned (and thus not zeored) by all processors.
315 9 : pbc_action=plumed.getActionSet().selectWithLabel<PbcAction*>("Box");
316 9 : if( !pbc_action ) {
317 0 : error("cannot align box has not been set");
318 : }
319 9 : boxValue=pbc_action->copyOutput(0);
320 18 : }
321 :
322 :
323 108 : void FitToTemplate::calculate() {
324 :
325 108 : if(!nopbc) {
326 96 : makeWhole();
327 : }
328 :
329 108 : if (type=="SIMPLE") {
330 48 : Vector cc;
331 :
332 144 : for(unsigned i=0; i<p_aligned.size(); ++i) {
333 96 : cc+=weights[i]*getPosition(i);
334 : }
335 :
336 48 : shift=center-cc;
337 48 : setValue(shift.modulo());
338 48 : unsigned nat = getTotAtoms();
339 6384 : for(unsigned i=0; i<nat; i++) {
340 6336 : std::pair<std::size_t,std::size_t> a = getValueIndices( AtomNumber::index(i));
341 6336 : Vector ato=getGlobalPosition(a);
342 6336 : setGlobalPosition(a,ato+shift);
343 : }
344 60 : } else if( type=="OPTIMAL" or type=="OPTIMAL-FAST") {
345 : // specific stuff that provides all that is needed
346 60 : double r=rmsd->calc_FitElements( getPositions(), rotation, drotdpos, centeredpositions, center_positions);
347 60 : setValue(r);
348 60 : unsigned nat = getTotAtoms();
349 8004 : for(unsigned i=0; i<nat; i++) {
350 7944 : std::pair<std::size_t,std::size_t> a = getValueIndices( AtomNumber::index(i));
351 7944 : Vector ato=getGlobalPosition(a);
352 7944 : setGlobalPosition(a,matmul(rotation,ato-center_positions)+center);
353 : }
354 : // rotate box
355 60 : Pbc& pbc(pbc_action->getPbc());
356 60 : pbc.setBox(matmul(pbc_action->getPbc().getBox(),transpose(rotation)));
357 : }
358 108 : }
359 :
360 108 : void FitToTemplate::apply() {
361 108 : auto nat=getTotAtoms();
362 108 : if (type=="SIMPLE") {
363 48 : Vector totForce;
364 6384 : for(unsigned i=0; i<nat; i++) {
365 6336 : std::pair<std::size_t,std::size_t> a = getValueIndices( AtomNumber::index(i));
366 6336 : totForce+=getForce(a);
367 : }
368 48 : Tensor vv=Tensor(center,totForce);
369 192 : for(unsigned i=0; i<3; ++i)
370 576 : for(unsigned j=0; j<3; ++j) {
371 432 : boxValue->addForce( 3*i+j, vv(i,j) );
372 : }
373 144 : for(unsigned i=0; i<p_aligned.size(); ++i) {
374 96 : addForce( p_aligned[i], -totForce*weights[i]);
375 : }
376 60 : } else if ( type=="OPTIMAL" or type=="OPTIMAL-FAST") {
377 60 : Vector totForce;
378 8004 : for(unsigned i=0; i<nat; i++) {
379 7944 : std::pair<std::size_t,std::size_t> a = getValueIndices( AtomNumber::index(i));
380 7944 : Vector f=getForce(a);
381 : // rotate back forces
382 7944 : Vector nf=matmul(transpose(rotation),f);
383 7944 : addForce(a, nf-f);
384 : // accumulate rotated c.o.m. forces - this is already in the non rotated reference frame
385 7944 : totForce+=nf;
386 : }
387 60 : Tensor virial;
388 240 : for(unsigned i=0; i<3; ++i)
389 720 : for(unsigned j=0; j<3; ++j) {
390 540 : virial[i][j] = boxValue->getForce( 3*i+j );
391 : }
392 : // notice that an extra Tensor(center,matmul(rotation,totForce)) is required to
393 : // compute the derivatives of the rotation with respect to center
394 60 : Tensor ww=matmul(transpose(rotation),virial+Tensor(center,matmul(rotation,totForce)));
395 : // rotate back virial
396 60 : virial=matmul(transpose(rotation),matmul(virial,rotation));
397 :
398 : // now we compute the force due to alignment
399 360 : for(unsigned i=0; i<p_aligned.size(); i++) {
400 300 : Vector g;
401 1200 : for(unsigned k=0; k<3; k++) {
402 : // this could be made faster computing only the diagonal of d
403 900 : Tensor d=matmul(ww,RMSD::getMatrixFromDRot(drotdpos,i,k));
404 900 : g[k]=(d(0,0)+d(1,1)+d(2,2));
405 : }
406 : // here is the extra contribution
407 300 : addForce( p_aligned[i], -g-weights[i]*totForce );
408 : // here it the contribution to the virial
409 : // notice that here we can use absolute positions since, for the alignment to be defined,
410 : // positions should be in one well defined periodic image
411 300 : virial+=extProduct(getPosition(i),g);
412 : }
413 : // finally, correction to the virial
414 60 : boxValue->clearInputForce();
415 60 : virial+=extProduct(matmul(transpose(rotation),center),totForce);
416 240 : for(unsigned i=0; i<3; ++i)
417 720 : for(unsigned j=0; j<3; ++j) {
418 540 : boxValue->addForce( 3*i+j, virial(i,j) );
419 : }
420 : }
421 108 : }
422 :
423 : }
424 : }
|