R 为数据帧的每一行有条件地计数
我有一个包含97个变量的数据框。对于变量32到97,我需要计算每行中出现的值1、2、3和4的实例数(仅适用于32到97的变量) 以下是数据帧的结构:R 为数据帧的每一行有条件地计数,r,dplyr,count,sum,conditional-statements,R,Dplyr,Count,Sum,Conditional Statements,我有一个包含97个变量的数据框。对于变量32到97,我需要计算每行中出现的值1、2、3和4的实例数(仅适用于32到97的变量) 以下是数据帧的结构: structure(list(subject_label = c("01", "01"), event_code = c("b", "16"), site_id = c(5, 5), site_label = c("a", "a&
# Two-row reproducible example of the data frame, in dput() style. Row 1 holds
# the populated record; row 2 is NA in nearly every column.
# Bound to `NTG`, the name used by the code that follows, so it can be run as is.
# `row.names` and `class` are attributes of the list, so they are passed to
# structure() and not placed inside list(); without `row.names` the object
# would report zero rows.
NTG <- structure(list(
  subject_label = c("01", "01"),
  event_code = c("b", "16"), site_id = c(5, 5), site_label = c("a", "a"),
  event_label = c("Baseline", NA),
  done = c(1L, NA), ndreason = c(NA_integer_, NA_integer_),
  rater = c("OLD", NA), carerid = c(1L, NA), ntgph = c(4L, NA),
  nt1ph = c(2L, NA), ntgmh = c(2L, NA), ntgse = c(0L, NA),
  ntgxv = c(1L, NA), ntgxb = c(0L, NA), ntgxg = c(0L, NA),
  ntgxh = c(0L, NA), ntgxd = c(0L, NA), ntgxa = c(0L, NA),
  ntgxm = c(0L, NA), ntgxw = c(0L, NA), ntgxp = c(0L, NA),
  ntgcd = c(0L, NA), ntgch = c(0L, NA), ntgcs = c(0L, NA),
  ntgnr = c(0L, NA), ntgii = c(0L, NA), ntsem = c(0L, NA),
  ntsei = c(0L, NA), ntsev = c(0L, NA), ntsey = c(NA_integer_, NA_integer_),
  ntseo = c("Interpersonal conflict with co-workers", NA),
  ntawb = c(0L, NA), ntahd = c(0L, NA), ntaid = c(0L, NA),
  ntaui = c(0L, NA), ntahe = c(0L, NA), ntaub = c(0L, NA),
  ntadi = c(1L, NA), ntatb = c(NA_integer_, NA_integer_),
  ntcic = c(0L, NA), ntcfw = c(0L, NA), ntcfi = c(0L, NA),
  ntclc = c(0L, NA), ntcnr = c(0L, NA), ntcnw = c(0L, NA),
  ntses = c(0L, NA), ntsia = c(0L, NA), ntswf = c(1L, NA),
  ntscn = c(0L, NA), ntssd = c(0L, NA), ntswn = c(0L, NA),
  ntswe = c(0L, NA), ntssl = c(0L, NA), ntacw = c(0L, NA),
  ntalb = c(0L, NA), ntacs = c(NA_integer_, NA_integer_),
  ntafa = c(0L, NA), ntaaw = c(0L, NA), ntmrp = c(0L, NA),
  ntmdr = c(0L, NA), ntmre = c(0L, NA), ntmfw = c(0L, NA),
  ntmlt = c(4L, NA), ntmmo = c(0L, NA), ntmwp = c(0L, NA),
  ntmpp = c(0L, NA), ntmpl = c(0L, NA), ntbaw = c(0L, NA),
  ntbws = c(1L, NA), ntbwp = c(4L, NA), ntbla = c(0L, NA),
  ntbow = c(0L, NA), ntbor = c(4L, NA), ntbhh = c(4L, NA),
  ntbfo = c(0L, NA), ntbii = c(4L, NA), ntblc = c(0L, NA),
  ntbaa = c(0L, NA), ntbad = c(0L, NA), ntbva = c(0L, NA),
  ntbpa = c(0L, NA), ntbtt = c(0L, NA), ntbll = c(0L, NA),
  ntbts = c(1L, NA), ntrca = c(0L, NA), ntrht = c(0L, NA),
  ntrst = c(0L, NA), ntrct = c(0L, NA), ntrci = c(1L, NA),
  ntrcm = c(0L, NA), ntoog = c(0L, NA), ntoop = c(0L, NA),
  ntoof = c(0L, NA), ntooa = c(0L, NA), ntoow = c(0L, NA),
  ntoov = c(0L, NA), ntgsp = c("a", NA),
  update_stamp = c("a", NA)
), row.names = c(NA, -2L), class = "data.frame")
我想做的是:
# Per-row count of the cells in columns 32-97 that equal 1.
# rowSums() returns one count per row, whereas length(which(...)) would return
# a single total for the whole block, recycled into every row.
# na.rm = TRUE keeps NA cells out of the count, so an all-NA row yields 0.
NTG$symptoms_morethanyear <- rowSums(NTG[, 32:97] == 1, na.rm = TRUE)
NTG$symptoms_morethanyear
如果您不介意修改第37列到第97列,下面是一种解决方案:
library(tidyverse)
# Overwrite columns 37-97 with a 0/1 flag (1 when the cell is 1, 2, 3 or 4;
# %in% never returns NA, so NA cells become 0), add the per-row total of those
# flags as `conts`, then show column 97 through the last column.
# across() replaces the superseded mutate_at()/vars(); last_col() avoids
# hard-coding an end position that may lie past the final column.
data_frame %>%
  mutate(across(37:97, ~ if_else(.x %in% 1:4, 1, 0))) %>%
  mutate(conts = rowSums(select(., 37:97))) %>%
  select(97:last_col())
ntoov ntgsp update_stamp conts
1 0 a a 10
2 0 <NA> <NA> 0
library(tidyverse)
data_frame%>%
mutate_at(vars(37:97), list(~if_else(. %in% 1:4, 1, 0)))%>%
mutate(conts = rowSums(select(., 37:97)))%>%select(97:101)
ntoov ntgsp update_stamp conts
1 0 a a 10
2 0 <NA> <NA> 0
如果不想修改第32列到第97列,也可以这样做:
library(data.table)
# Flag every cell of columns 32-97 that lies in the closed range [1, 4] and
# count the flags per row; na.rm = TRUE makes NA cells contribute nothing.
# The source columns themselves are left unchanged.
data_frame$counts <- rowSums(
  data_frame[, 32:97] %between% c(1, 4),
  na.rm = TRUE
)
# Show column 90 through the last column (the new `counts`) with base
# indexing, so this snippet needs no package beyond data.table.
data_frame[, 90:ncol(data_frame)]
ntrci ntrcm ntoog ntoop ntoof ntooa ntoow ntoov ntgsp update_stamp counts
1 1 0 0 0 0 0 0 0 a a 10
2 NA NA NA NA NA NA NA NA <NA> <NA> 0
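library(data.table)
data_frame$counts <- rowSums(data_frame[,32:97] %between% c(1,4), na.rm=T)
data_frame%>%select(90:101)
ntrci ntrcm ntoog ntoop ntoof ntooa ntoow ntoov ntgsp update_stamp counts
1 1 0 0 0 0 0 0 0 a a 10
2 NA NA NA NA NA NA NA NA <NA> <NA> 0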
您能否添加所需的输出,以便其他人进行比较?谢谢!
这回答了我的问题——改用 rowSums 就解决了。