The data is as follows:
cat <- c('A','A','A','B','B','A','C','B')
value <- c(1,1,1,2,2,1,3,2)
df <- data.frame(cat,value)
I want to create a new column which keeps the first occurrence of each 'cat'.
Order is important!
df$new <- ave(df$value, df$cat, FUN = function(z) c(z[1], rep(0, length(z)-1)))
df
# cat value new
# 1 A 1 1
# 2 A 1 0
# 3 A 1 0
# 4 B 2 2
# 5 B 2 0
# 6 A 1 0
# 7 C 3 3
# 8 B 2 0
library(dplyr)
df %>%
group_by(cat) %>%
mutate(new = if_else(row_number() == 1, value, 0)) %>%
ungroup()
# # A tibble: 8 x 3
# cat value new
# <chr> <dbl> <dbl>
# 1 A 1 1
# 2 A 1 0
# 3 A 1 0
# 4 B 2 2
# 5 B 2 0
# 6 A 1 0
# 7 C 3 3
# 8 B 2 0
or
df %>%
group_by(cat) %>%
mutate(new = c(value[1], rep(0, n() - 1))) %>%
ungroup()
library(data.table)
DF <- as.data.table(df)
DF[, new := c(value[1], rep(0, .N - 1)), by = .(cat)]
# cat value new
# <char> <num> <num>
# 1: A 1 1
# 2: A 1 0
# 3: A 1 0
# 4: B 2 2
# 5: B 2 0
# 6: A 1 0
# 7: C 3 3
# 8: B 2 0