1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283
|
/***************************************************************************
* Copyright (C) 2009 by BUI Quang Minh *
* minh.bui@univie.ac.at *
* *
* This program is free software; you can redistribute it and/or modify *
* it under the terms of the GNU General Public License as published by *
* the Free Software Foundation; either version 2 of the License, or *
* (at your option) any later version. *
* *
* This program is distributed in the hope that it will be useful, *
* but WITHOUT ANY WARRANTY; without even the implied warranty of *
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
* GNU General Public License for more details. *
* *
* You should have received a copy of the GNU General Public License *
* along with this program; if not, write to the *
* Free Software Foundation, Inc., *
* 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. *
***************************************************************************/
#ifndef MODELFACTORY_H
#define MODELFACTORY_H
#include "utils/tools.h"
#include "modelsubst.h"
#include "rateheterogeneity.h"
#include "nclextra/modelsblock.h"
#include "utils/checkpoint.h"
#include "alignment/alignment.h"
const double MIN_BRLEN_SCALE = 0.01;
const double MAX_BRLEN_SCALE = 100.0;
ModelsBlock *readModelsDefinition(Params ¶ms);
/**
return the position of +H or *H in the model name
@param model_name model name string
@return position of +H or *H in the model string, string::npos if not found
*/
string::size_type posRateHeterotachy(string &model_name);
/**
return the position of +R or *R in the model name
@param model_name model name string
@return position of +R or *R in the model string, string::npos if not found
*/
string::size_type posRateFree(string &model_name);
/**
return the position of +P or *P in the model name
@param model_name model name string
@return position of +P or *P in the model string, string::npos if not found
*/
string::size_type posPOMO(string &model_name);
/**
Store the transition matrix corresponding to evolutionary time so that one must not compute again.
For efficiency purpose esp. for protein (20x20) or codon (61x61).
The values of the map contain 3 matricies consecutively: transition matrix, 1st, and 2nd derivative
@author BUI Quang Minh <minh.bui@univie.ac.at>
*/
class ModelFactory : public unordered_map<int, double*>, public Optimization, public CheckpointFactory
{
public:
/**
constructor
create substitution model with possible rate heterogeneity. Create proper class objects
for two variables: model and site_rate. It takes the following field of params into account:
num_rate_cats, freq_type, store_trans_matrix
@param params program parameters
@param model_name full model name
@param tree associated phylogenetic tree
*/
ModelFactory(Params ¶ms, string &model_name, PhyloTree *tree, ModelsBlock *models_block);
/**
blank constructor
*/
ModelFactory();
/**
set checkpoint object
@param checkpoint
*/
virtual void setCheckpoint(Checkpoint *checkpoint);
/**
start structure for checkpointing
*/
virtual void startCheckpoint();
/**
save object into the checkpoint
*/
virtual void saveCheckpoint();
/**
restore object from the checkpoint
*/
virtual void restoreCheckpoint();
/**
get the name of the model
*/
//string getModelName();
virtual void writeInfo(ostream &out) {}
/**
Start to store transition matrix for efficiency
*/
void startStoringTransMatrix();
/**
Stop storing transition matrix, e.g., when optimizing model parameters
*/
void stopStoringTransMatrix();
/**
Wrapper for computing the transition probability matrix from the model. It use ModelFactory
that stores matrix computed before for effiency purpose.
@param time time between two events
@param mixture (optional) class for mixture model
@param trans_matrix (OUT) the transition matrix between all pairs of states.
Assume trans_matrix has size of num_states * num_states.
*/
void computeTransMatrix(double time, double *trans_matrix, int mixture = 0);
/**
Wrapper for computing the transition probability between two states.
@param time time between two events
@param state1 first state
@param state2 second state
*/
double computeTrans(double time, int state1, int state2);
/**
Wrapper for computing the transition probability between two states
@param time time between two events
@param state1 first state
@param state2 second state
@param derv1 (OUT) 1st derivative
@param derv2 (OUT) 2nd derivative
*/
virtual double computeTrans(double time, int state1, int state2, double &derv1, double &derv2);
/**
Wrapper for computing the transition probability matrix and the derivative 1 and 2 from the model.
It use ModelFactory that stores matrix computed before for effiency purpose.
@param time time between two events
@param mixture (optional) class for mixture model
@param trans_matrix (OUT) the transition matrix between all pairs of states.
Assume trans_matrix has size of num_states * num_states.
@param trans_derv1 (OUT) the 1st derivative matrix between all pairs of states.
@param trans_derv2 (OUT) the 2nd derivative matrix between all pairs of states.
*/
void computeTransDerv(double time, double *trans_matrix,
double *trans_derv1, double *trans_derv2, int mixture = 0);
/**
destructor
*/
virtual ~ModelFactory();
/**
* @param brlen_type either BRLEN_OPTIMIZE, BRLEN_FIX or BRLEN_SCALE
* @return #parameters of the model + # branches
*/
virtual int getNParameters(int brlen_type);
/**
optimize model parameters and tree branch lengths
NOTE 2016-08-20: refactor the semantic of fixed_len
@param fixed_len 0: optimize branch lengths, 1: fix branch lengths, 2: scale branch lengths
@param write_info TRUE to write model parameters every optimization step, FALSE to only print at the end
@param logl_epsilon log-likelihood epsilon to stop
@param gradient_epsilon gradient (derivative) epsilon to stop
@return the best likelihood
*/
virtual double optimizeParameters(int fixed_len = BRLEN_OPTIMIZE, bool write_info = true,
double logl_epsilon = 0.1, double gradient_epsilon = 0.0001);
/**
* optimize model parameters and tree branch lengths for the +I+G model
* using restart strategy.
* @param fixed_len TRUE to fix branch lengths, default is false
* @return the best likelihood
*/
virtual double optimizeParametersGammaInvar(int fixed_len = BRLEN_OPTIMIZE, bool write_info = true,
double logl_epsilon = 0.1, double gradient_epsilon = 0.0001);
/**
* @return TRUE if parameters are at the boundary that may cause numerical unstability
*/
virtual bool isUnstableParameters();
/**
pointer to the model, will not be deleted when deleting ModelFactory object
*/
ModelSubst *model;
/**
pointer to the site-rate heterogeneity, will not be deleted when deleting ModelFactory object
*/
RateHeterogeneity *site_rate;
/* TRUE if a fused mixture and rate model, e.g. LG4M and LG4X */
bool fused_mix_rate;
/**
TRUE to store transition matrix into this hash table for computation efficiency
*/
bool store_trans_matrix;
/**
TRUE for storing process
*/
bool is_storing;
/**
* encoded constant sites that are unobservable and added in the alignment
* this involves likelihood function for ascertainment bias correction for morphological or SNP data (Lewis 2001)
*/
string unobserved_ptns;
/**
* optimize model and site_rate parameters
* @param gradient_epsilon to control stop
* @param cur_logl current log-likelihood
*/
double optimizeParametersOnly(int num_steps, double gradient_epsilon, double cur_logl);
/************* FOLLOWING FUNCTIONS SERVE FOR JOINT OPTIMIZATION OF MODEL AND RATE PARAMETERS *******/
/**
* TRUE to optimize all parameters simultaneously, default: FALSE
*/
bool joint_optimize;
/**
return the number of dimensions
*/
virtual int getNDim();
/**
the target function which needs to be optimized
@param x the input vector x
@return the function value at x
*/
virtual double targetFunk(double x[]);
double initGTRGammaIParameters(RateHeterogeneity *rate, ModelSubst *model, double initAlpha,
double initPInvar, double *initRates, double *initStateFreqs);
double optimizeAllParameters(double gradient_epsilon);
protected:
/**
this function is served for the multi-dimension optimization. It should pack the model parameters
into a vector that is index from 1 (NOTE: not from 0)
@param variables (OUT) vector of variables, indexed from 1
*/
virtual void setVariables(double *variables);
/**
this function is served for the multi-dimension optimization. It should assign the model parameters
from a vector of variables that is index from 1 (NOTE: not from 0)
@param variables vector of variables, indexed from 1
@return TRUE if parameters are changed, FALSE otherwise (2015-10-20)
*/
virtual bool getVariables(double *variables);
vector<double> optimizeGammaInvWithInitValue(int fixed_len, double logl_epsilon, double gradient_epsilon,
double initPInv, double initAlpha, DoubleVector &lenvec, Checkpoint *model_ckp);
};
#endif
|