我想提取 col1 和 col2 中相同的文本/值,并在我的数据框中创建如下所示的 "desired_col" 列。我尝试了一些方法,但都没有成功。
# Example input: two ID columns plus the shared leading text expected for
# each row.
mydata_1 <- data.frame(
  col1 = c("SL1234", "SL786876"),
  col2 = c("SL1334", "SL78076"),
  desired_col = c("SL1", "SL78")
)
答案 0 :(得分:3)
一种使用 mapply 的方案:
# Add a `matched` column holding the longest common leading substring
# (prefix) of `col1` and `col2`, computed row by row.
mydata_1$matched <- mapply(
  function(x, y) {
    # A missing input has no defined prefix.
    if (is.na(x) || is.na(y)) {
      return(NA_character_)
    }
    x_chars <- strsplit(x, split = "")[[1]]
    y_chars <- strsplit(y, split = "")[[1]]
    # Only the positions present in both strings can be compared.
    overlap <- seq_len(min(length(x_chars), length(y_chars)))
    first_diff <- which(x_chars[overlap] != y_chars[overlap])[1]
    # No mismatch inside the overlap (identical strings, or one is a prefix
    # of the other): the whole overlap is shared. Without this guard,
    # `first_diff` is NA and substring() would return NA.
    matching_len <- if (is.na(first_diff)) length(overlap) else first_diff - 1L
    substring(x, 1, matching_len)
  },
  # as.character() lets this work when the columns are factors.
  as.character(mydata_1$col1),
  as.character(mydata_1$col2),
  # Keep the new column a plain vector instead of one named by `col1`.
  USE.NAMES = FALSE
)
mydata_1
# Expected output:
#       col1    col2 desired_col matched
# 1   SL1234  SL1334         SL1     SL1
# 2 SL786876 SL78076        SL78    SL78
数据:
# Sample data for the answer. Strings are kept as character vectors (not
# factors) so that string functions can be applied to the columns directly.
mydata_1 <- data.frame(
  col1 = c("SL1234", "SL786876"),
  col2 = c("SL1334", "SL78076"),
  desired_col = c("SL1", "SL78"),
  stringsAsFactors = FALSE
)