A
> # data.table supplies the `:=` column assignment and grouped `j` queries below.
> library(data.table)
> # Example table: 2000 rows with a two-level label and a standard-normal value.
> # No seed is set, so the exact numbers differ from run to run.
> my_dt <- data.table(
+   var1 = sample(c("a", "b"), size = 2000, replace = TRUE),
+   var2 = rnorm(n = 2000)
+ )
>
> # Label every row as train / test / validate, drawn independently with
> # probabilities 0.7 / 0.15 / 0.15, so the realised split is only approximate.
> my_dt[, tg := sample(
+   c("train", "test", "validate"),
+   size = .N,
+   replace = TRUE,
+   prob = c(0.7, 0.15, 0.15)
+ )]
> # Share of rows in each group: group size divided by the total row count.
> my_dt[, .N / nrow(my_dt), by = tg]
tg V1
1: train 0.6975
2: validate 0.1610
3: test 0.1415