有一个revcumsum函数
library(spatstat.utils)
dt[, roll_cumsum2 := revcumsum(a), group]
-输出
dt
# a group roll_cumsum roll_cumsum2
# 1: 1 1 15 15
# 2: 2 1 14 14
# 3: 3 1 12 12
# 4: 4 1 9 9
# 5: 5 1 5 5
# 6: 6 2 40 40
# 7: 7 2 34 34
# 8: 8 2 27 27
# 9: 9 2 19 19
#10: 10 2 10 10
或者只是做reverse
dt[, roll_cumsum2 := rev(cumsum(rev(a))), group]
-输出
dt
# a group roll_cumsum roll_cumsum2
# 1: 1 1 15 15
# 2: 2 1 14 14
# 3: 3 1 12 12
# 4: 4 1 9 9
# 5: 5 1 5 5
# 6: 6 2 40 40
# 7: 7 2 34 34
# 8: 8 2 27 27
# 9: 9 2 19 19
#10: 10 2 10 10
或者另一种方式是
dt[, roll_cumsum2 := cumsum(a[.N:1])[.N:1], group]
注意:两者都是精简版
基准测试
dt1 <- data.table(a = 1:1e7, group = rep(1:1e6, length.out = 1e7, 10))
system.time(dt1[, roll_cumsum := partial_sum(a), by = group])
#user system elapsed
# 2.073 0.037 2.094
system.time(dt1[, roll_cumsum2 := revcumsum(a), group])
#user system elapsed
# 2.623 0.029 2.637
system.time(dt1[, roll_cumsum3 := rev(cumsum(rev(a))), group])
#user system elapsed
# 4.275 0.051 4.276
system.time(dt1[, roll_cumsum4 := cumsum(a[.N:1])[.N:1], group])
#user system elapsed
# 1.703 0.028 1.722
system.time(dt1[, roll_cumsum5 := sum(a) - cumsum(shift(a, fill = 0)), group])
# user system elapsed
# 10.095 0.041 10.129