您可以简单地使用phy$edge.length
生成的phylo
对象的DDD::L2phylo
组件:
## Measuring the sum of the branch lengths from `phy`
sum_br_length <- sum(phy$edge.length)
sum_br_length == Faith$PD
# [1] TRUE
## Measuring the sum of the branch length from `L`
sum_br_length <- sum(DDD::L2phylo(L,dropextinct = TRUE)$edge.length)
sum_br_length == Faith$PD
# [1] TRUE
一些微基准测试很有趣:
library(microbenchmark)
## Function 1
fun1 <- function(L) {
comm = as.data.frame(L) %>% dplyr::select(V3:V4) %>%
dplyr::rename(id = V3,pa = V4) %>%
dplyr::mutate(id = paste0("t",abs(id))) %>%
dplyr::mutate(pa = dplyr::if_else(pa == -1,1,0)) %>%
dplyr::mutate(plot = 0) %>%
dplyr::select(plot,pa,id) %>%
picante::sample2matrix()
# convert L table into phylogeny
phy = DDD::L2phylo(L,dropextinct = T)
# calculate Faith's index using pd() function
Faith = picante::pd(comm,phy)
return(Faith$PD)
}
## Function 2
fun2 <- function(L) {
phy <- DDD::L2phylo(L,dropextinct = T)
return(sum(phy$edge.length))
}
## Function 3
fun3 <- function(L) {
return(sum(DDD::L2phylo(L,dropextinct = TRUE)$edge.length))
}
## Do all of them give the same results
fun1(L) == Faith$PD
# [1] TRUE
fun2(L) == Faith$PD
# [1] TRUE
fun3(L) == Faith$PD
# [1] TRUE
## Which function fastest?
microbenchmark(fun1(L),fun2(L),fun3(L))
# Unit: milliseconds
# expr min lq mean median uq max neval
# fun1(L) 6.486462 6.900641 8.273386 7.445334 8.667535 16.888429 100
# fun2(L) 1.627854 1.683204 2.215531 1.771219 2.229408 9.522366 100
# fun3(L) 1.630635 1.663181 2.229206 1.859733 2.448196 7.573001 100
,
我检查了pd::sample2matrix
以了解其内部功能。 tapply
调用和以下行似乎是唯一必要的部分。
library(DDD)
library(tidyverse)
library(picante)
#> Loading required package: ape
#> Loading required package: vegan
#> Loading required package: permute
#> Loading required package: lattice
#> This is vegan 2.5-6
#> Loading required package: nlme
#>
#> Attaching package: 'nlme'
#> The following object is masked from 'package:dplyr':
#>
#> collapse
set.seed(100)
result <- dd_sim(c(0.2,0.1,20),10)
# with birth rate 0.2,death rate 0.1,carrying capacity 20 and overall 10 million years.
L <- result$L
# convert L table into community data matrix
comm_original = as.data.frame(L) %>% dplyr::select(V3:V4) %>%
dplyr::rename(id = V3,pa = V4) %>%
dplyr::mutate(id = paste0("t",abs(id))) %>%
dplyr::mutate(pa = dplyr::if_else(pa == -1,0)) %>%
dplyr::mutate(plot = 0) %>%
dplyr::select(plot,id) %>%
picante::sample2matrix()
# Instead of using dplyr,we'll do some base R operations
# on L. The code doesn't look as nice,but it should be
# significantly faster.
pa <- ifelse(L[,4] == -1,0)
plot <- rep(0,length(pa))
id <- paste0("t",abs(L[,3]))
comm_new <- tapply(pa,list(plot,id),sum)
comm_new[is.na(comm_new)] <- 0
# convert L table into phylogeny
phy = DDD::L2phylo(L,dropextinct = T)
# calculate Faith's index using pd() function
picante::pd(comm_original,phy)
#> PD SR
#> 0 29.82483 6
picante::pd(comm_new,phy)
#> PD SR
#> 0 29.82483 6
Created on 2019-11-17 by the reprex package (v0.3.0)
编辑:original()
是您最初构建comm
的方式,new()
是上面给出的方式。如果您将其交换,看来您可以期望将速度提高2倍。我知道这并不是很大的收益,具体取决于工作负载的大小,但总比没有好。
expression min median `itr/sec` mem_alloc `gc/sec` n_itr n_gc total_time result memory time gc
<bch:expr> <bch:tm> <bch:tm> <dbl> <bch:byt> <dbl> <int> <dbl> <bch:tm> <list> <list> <list> <list>
1 original() 9.76ms 10.24ms 96.1 552KB 2.04 47 1 489ms <df[,1125] [1 x 1,1~ <df[,3] [107 x~ <bch:t~ <tibble [48 x~
2 new() 4.57ms 4.84ms 201. 464KB 2.07 97 1 483ms <dbl[,~ <df[,3] [63 x ~ <bch:t~ <tibble [98 x~
本文链接:https://www.f2er.com/3103749.html