# 你看看这是不是你想要的
library(readxl)
# Read the workbook once, supplying explicit column names a1..a5 instead of
# taking them from the sheet.
# NOTE(review): assumes the sheet has exactly five columns -- confirm.
dat <- read_xlsx("example_test.xlsx", col_names = paste0("a", 1:5))

# Column a5 holds the text entries that are parsed further down the script.
tmp <- dat[["a5"]]
# Parse every a5 entry into a flat character vector of alternating field names
# and values: c(name1, value1, name2, value2, ...).
# NOTE(review): the entry layout appears to be
# "<name>:<value>;<name>:<value><name>:<value>..." where each field after the
# ';' begins with the character '变' -- inferred from the splitting logic,
# confirm against the real data.

# Zero-width pattern: a position that has at least one character before it and
# '变' right after it. Splitting there is intended to keep '变' at the head of
# each resulting piece. Built once because it does not change per entry.
field_boundary <- paste0("(?<=.)(?=", "变", ")")

# Split one entry into its name/value tokens.
#   entry: a length-one character vector.
#   returns: character vector of the tokens, in order of appearance.
parse_entry <- function(entry) {
  parts <- strsplit(entry, split = ";")[[1]]
  # Part before the first ';' is a single "name:value" pair.
  head_pair <- strsplit(parts[1], split = ":")
  # Part after it is cut into fields at each boundary, then into name/value.
  tail_fields <- strsplit(parts[2], split = field_boundary, perl = TRUE)[[1]]
  tail_pairs <- strsplit(tail_fields, split = ":")
  c(unlist(head_pair), unlist(tail_pairs))
}

# lapply() returns an empty list when the column is empty, so no index-based
# loop bounds are needed.
tmplist <- lapply(tmp, parse_entry)
tmplist
# Convert each parsed token vector into a 1-row character matrix: column names
# are the field names (odd positions), the single row holds the values (even
# positions), and there are no row names.

# Build the 1-row matrix for one record.
#   exstr: character vector of alternating names and values.
#   returns: 1 x (n / 2) character matrix with named columns.
#   stops with an error when exstr does not consist of complete pairs.
pairs_to_row <- function(exstr) {
  n <- length(exstr)
  # An incomplete pair cannot be mapped to name/value columns; fail with a
  # message that says so instead of a low-level indexing error.
  if (n < 2L || n %% 2L != 0L) {
    stop(
      "expected alternating name/value pairs, got ", n, " element(s)",
      call. = FALSE
    )
  }
  matrix(
    exstr[seq(2, n, 2)],
    nrow = 1,
    dimnames = list(NULL, exstr[seq(1, n, 2)])
  )
}

# Iterate over tmplist itself so that an empty input yields an empty result.
datlist <- lapply(tmplist, pairs_to_row)
datlist
# For every element of datlist, keep the entries whose column name equals the
# wanted field. Change the Chinese field name below to look up a different
# piece of information for each company.
idlist <- lapply(datlist, function(record) {
  wanted_field <- "变更前申请人"
  is_wanted <- colnames(record) == wanted_field
  record[is_wanted]
})
idlist