# Clade_label.R
# Forked from hackseq/hs19-flu.
# Load the per-clade table from the file "Data" (comma-separated, with a
# header row) and replace its header with the fixed column names below.
# Strings are kept as character vectors rather than factors.
df <- read.csv("Data", sep = ",", header = TRUE, stringsAsFactors = FALSE)
# The names are assigned by position, so the file must list its columns in
# exactly this order.
# NOTE(review): "MeadianEp" looks like a typo for "MedianEp"; it is left
# unchanged here because other code may refer to the column by this name.
names(df) <- c(
  "Clade", "numberTipsClade", "numberTipsTrimmed", "sackin",
  "colless", "Variance", "I2", "B1", "B2", "avgLadder", "ILnumber",
  "pitchforks", "maxHeight", "MaxWidth", "DelW", "Stairs1", "Stairs2",
  "Cherries", "BS", "descinm", "getstattest", "skewness", "kurtosis",
  "MeanPairwiseDist", "MaxPairwiseDist", "diameter", "WienerIndex",
  "betweenness", "closeness", "eigenvector", "MeadianEp", "MaxEp", "MeanEp"
)
# Width of the window applied above each clade's node when selecting tips.
# NOTE(review): units are presumably those of the tree's edge lengths -- confirm.
TimeFrame <- 3.4

# `tree` is not created in this script; it must already exist in the session.
# NOTE(review): node.depth.edgelength() / allDescendants() are presumably the
# ape / phangorn functions -- confirm the packages are attached by the caller.
nTips <- length(tree$tip.label)
allD <- allDescendants(tree)
allHeights <- node.depth.edgelength(tree)

# Node ids of the clades: the first column ("Clade") of the data.
nodeids <- df$Clade
# Tips within the TimeFrame for each node.
# For every node id in `nodeids`: take the node's entry in `allD`, keep only
# the tip ids (ids <= nTips), then keep the tips whose height is at most
# `TimeFrame` above the height of the node itself.
#
# lapply() is used instead of sapply() so the result is always a list with
# one element per clade. sapply() collapses the result into a matrix whenever
# every clade happens to retain the same number of tips, and the size count
# below would then be computed per tip instead of per clade.
allTrimmedClades <- lapply(nodeids, function(node) {
  descendants <- allD[[node]]
  tipDescendants <- descendants[descendants <= nTips]
  # Original note: here, would need something like allDates[myTipDesc]
  tipTimes <- allHeights[tipDescendants]
  tipDescendants[tipTimes <= allHeights[node] + TimeFrame]
})

# Sizes of the trimmed clades: one count per clade. lengths() measures each
# list element directly (the previous code indexed the outer list by tip ids)
# and returns integer(0), not list(), when there are no clades.
allTrimmedSizes_3.4 <- lengths(allTrimmedClades)

# Ratio of each clade's size within the TimeFrame window to its
# `numberTipsTrimmed` value from the data.
Labels <- allTrimmedSizes_3.4 / df$numberTipsTrimmed