File: Yule.hs

package info (click to toggle)
bali-phy 4.0-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 15,392 kB
  • sloc: cpp: 120,442; xml: 13,966; haskell: 9,975; python: 2,936; yacc: 1,328; perl: 1,169; lex: 912; sh: 343; makefile: 26
file content (133 lines) | stat: -rw-r--r-- 5,777 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
module Probability.Distribution.Tree.Yule where

import           Tree
import           Probability.Random
import           Probability.Distribution.Uniform
import           Probability.Distribution.Tree.Modifiable
import           Probability.Distribution.Tree.Util
import           Probability.Distribution.Exponential
import qualified Data.IntMap as IntMap
import           Data.Text (Text)
import           Data.Maybe (isJust, fromJust)
import           MCMC
import           Data.Array

yulePrFactors :: (HasRoots t, HasNodeTimes t) => Int -> Rate -> t -> [LogDouble]
yulePrFactors n lambda tree = require (numLeaves tree == n)
                              : pow (toLogDouble lambda) (fromIntegral (n-2))
                              : [ expToLogDouble (-lambda * deltaT ) * require (deltaT >= 0)
                                      | node <- getNodes tree,
                                        let parent = parentNode tree node,
                                        isJust parent,
                                        let deltaT = (nodeTime tree (fromJust parent) - nodeTime tree node)
                                ]

-------------------------------------------------------------
timesToAges tree = modifyNodeTimes tree (maxTime -) where maxTime = maximum (nodeTimes tree)

-- This way of constructing the tree -- from the root to the tips, ensures that the tip
--    labels will look like 1,(3,4) or (3,4),2 when we have 3 leaves.
-- When a node i splits into two new nodes, we need to use i as the internal node name
--    because we already have a branch connected to it.
-- We could additionally sample integer labels [0..n-1] and randomly assign them to the tips.
--    When we hit the present we can shuffle the existing node numbers to assign labels [0..n]
-- Alternatively, we could also try arrange that the labels for each tip are actually a function
--    that passes additional labels to the ancestor.

sampleYule n lambda = do 

  let go :: Time -> Int -> [Int] -> ([Int],[(Int,Int)],[(Int,Double)]) -> Random ([Int], [(Int,Int)], [(Int,Double)])
      go t1 nextNode activeNodes (nodes, edges, nodeTimes) = do

              t2 <- (t1 +) <$> sample (exponential (1 / (lambda * (fromIntegral (length activeNodes)))))

              if length activeNodes == n then do
                  t2' <- sample $ uniform t1 t2
                  let nodeTimes' = [(node,t2') | node <- activeNodes] ++ nodeTimes
                  return (nodes, edges, nodeTimes')
              else do
                  (n0,rest) <- removeOne activeNodes
                  let n1 = nextNode
                      n2 = nextNode+1
                      nextNode' = nextNode + 2
                      nodes' = n1:n2:nodes
                      edges' = (n0,n1):(n0,n2):edges
                      nodeTimes' = (n0,t2):nodeTimes
                  go t2 nextNode'(n1:n2:rest) (nodes', edges', nodeTimes')

      t0 = 0
      nextNode0 = 3
      nodes0 = [0,1,2]
      edges0 = [(0,1),(0,2)]
      nodeTimes0 = [(0, t0)]
      activeNodes0 = [1,2]

  (nodes, edges, nodeTimes) <- go t0 nextNode0 activeNodes0 (nodes0, edges0, nodeTimes0)

  let root = 0
      topology = addRoot root (treeFromEdges nodes edges)
      timeTree = time_tree topology (IntMap.fromList nodeTimes)
      ageTree = timesToAges timeTree

  return ageTree

-------------------------------------------------------------

yuleEffect tree = do
  -- Resample all the node times, including the root...
  -- But what if some node times are fixed?
  -- FIXME: check that leaf times are fixed?
  -- sequence_ [ addMove 1 $ sliceSample (nodeTime tree node) (above 0) | node <- internalNodes tree]

  -- This allow attaching at the same level OR more rootward.
  -- FIXME: but it doesn't allow becoming the root!
  -- QUESTION: Could we slice sample the root location?
  -- QUESTION: Could we somehow propose a root location based on the likelihood/posterior?
  -- sequence_ [ addMove 1 $ metropolisHastings $ fnpr_unsafe_proposal tree node | node <- getNodes tree]

  -- Exchange sibling branches with children?
  addMove 1 $ walkTimeTreeSampleNNIandNodeTimes tree

-------------------------------------------------------------

data UnlabelledYule = UnlabelledYule Int Rate

instance Dist UnlabelledYule where
    type Result UnlabelledYule = WithNodeTimes (WithRoots (Tree ()))
    dist_name _ = "yule"

instance HasAnnotatedPdf UnlabelledYule where
    annotated_densities (UnlabelledYule n lambda) tree = return (yulePrFactors n lambda tree, ())

instance Sampleable UnlabelledYule where
    sample dist@(UnlabelledYule n lambda) = RanDistribution3 dist yuleEffect triggeredModifiableTimeTree (sampleYule n lambda)

unlabelledYule n lambda = UnlabelledYule n lambda

-------------------------------------------------------------
{-
   We need the random shuffling to be performed in the IO monad (which doesn't remember anything)
   during the initial sample.

   We do NOT want the shuffle to be performed in the Random monad, because we don't want its
   random choices to be remembered and then resampled during MCMC.
 -}

sampleLabeledYule labels lambda = do
  tree <- sample $ unlabelledYule (length labels) lambda
  leafIndices <- zip (leafNodes tree) <$> shuffle labels
  return $ addLabels leafIndices tree

data Yule l = Yule [l] Rate

instance Dist (Yule l) where
    type Result (Yule l) = WithNodeTimes (WithRoots (Tree l))
    dist_name _ = "Yule"

instance HasAnnotatedPdf (Yule l) where
    annotated_densities (Yule taxa lambda) tree = return (yulePrFactors (length taxa) lambda tree, ())

instance Sampleable (Yule l) where
    sample dist@(Yule taxa lambda) = RanDistribution3 dist yuleEffect triggeredModifiableTimeTree (sampleLabeledYule taxa lambda)

yule taxa lambda = Yule taxa lambda