Create lags with a for-loop in R

Posted by cptn on Stack Overflow See other posts from Stack Overflow or by cptn
Published on 2014-06-01T07:47:45Z Indexed on 2014/06/01 15:27 UTC
Read the original article Hit count: 206

Filed under:
|
|
|

I've got a data.frame with stock data of several companies (here it's only two). I want 10 additional columns in my stock data.frame df with lagged dates (from -5 days to +5 days) for both companies in my event data.frame. I'm using a for loop which is probably not the best solution, but it works partially.

DATE <- c("01.01.2000","02.01.2000","03.01.2000","06.01.2000","07.01.2000","09.01.2000","10.01.2000","01.01.2000","02.01.2000","04.01.2000","06.01.2000","07.01.2000","09.01.2000","10.01.2000")
RET <- c(-2.0,1.1,3,1.4,-0.2, 0.6, 0.1, -0.21, -1.2, 0.9, 0.3, -0.1,0.3,-0.12)
COMP <- c("A","A","A","A","A","A","A","B","B","B","B","B","B","B")
df <- data.frame(DATE, RET, COMP, stringsAsFactors=F)

df

# DATE   RET COMP
# 1  01.01.2000 -2.00    A
# 2  02.01.2000  1.10    A
# 3  03.01.2000  3.00    A
# 4  06.01.2000  1.40    A
# 5  07.01.2000 -0.20    A
# 6  09.01.2000  0.60    A
# 7  10.01.2000  0.10    A
# 8  01.01.2000 -0.21    B
# 9  02.01.2000 -1.20    B
# 10 04.01.2000  0.90    B
# 11 06.01.2000  0.30    B
# 12 07.01.2000 -0.10    B
# 13 09.01.2000  0.30    B
# 14 10.01.2000 -0.12    B

this loop works fine

comp <- as.vector(unique(df$COMP))
mylist <- vector('list', length(comp))

# create lags in DATE
for(i in 1:length(comp)) {
  print(i)
  comp_i <- comp[i]
  df_k <- df[df$COMP %in% comp_i, ] # all trading days of one firm

  df_k <- transform(df_k, 
                      DATEm1 = c(NA, head(DATE, -1)), 
                      DATEm2 = c(NA, NA, head(DATE, -2)), 
                      DATEm3 = c(NA, NA, NA, head(DATE, -3)),
                      DATEm4 = c(NA, NA, NA, NA,head(DATE, -4)), 
                      DATEm5 = c(NA, NA, NA, NA, NA, head(DATE, -5)),
                      DATEp1 = c(DATE[-1], NA))
                     #DATEp2 = c(DATE[-2], NA, NA),
                     #DATEp3 = c(DATE[-3], NA, NA, NA),
                     #DATEp4 = c(DATE[-4], NA, NA, NA, NA),
                     #DATEp5 = c(DATE[-5], NA, NA, NA, NA, NA))

  mylist[[i]] = df_k
} 

df1 <- do.call(rbind, mylist)

But if I add the lines with DATEp2, DATEp3, DATEp4, DATEp5. the code doesn't work. Can anybody tell me what I'm doing wrong here? Here the code with all the lagged dates.

# create lags in DATE
for(i in 1:length(comp)) {
  print(i)
  comp_i <- comp[i]
  df_k <- df[df$COMP %in% comp_i, ] # all trading days of one firm

  df_k <- transform(df_k, 
                      DATEm1 = c(NA, head(DATE, -1)), 
                      DATEm2 = c(NA, NA, head(DATE, -2)), 
                      DATEm3 = c(NA, NA, NA, head(DATE, -3)),
                      DATEm4 = c(NA, NA, NA, NA,head(DATE, -4)), 
                      DATEm5 = c(NA, NA, NA, NA, NA, head(DATE, -5)),
                      DATEp1 = c(DATE[-1], NA),
                      DATEp2 = c(DATE[-2], NA, NA),
                      DATEp3 = c(DATE[-3], NA, NA, NA),
                      DATEp4 = c(DATE[-4], NA, NA, NA, NA),
                      DATEp5 = c(DATE[-5], NA, NA, NA, NA, NA))

  mylist[[i]] = df_k
} 

df1 <- do.call(rbind, mylist)

© Stack Overflow or respective owner

Related posts about r

    Related posts about date