# 0. Build the example data set: Y is the dependent variable, every other
#    column is an independent variable.

# Fix the random seed so the generated data is identical on every run.
set.seed(1234)

# 600 simulated observations. The columns are drawn in the order they are
# listed, so reordering them would change the values produced by the seed.
log_data <- data.frame(
  Y = sample(0:1, 600, replace = TRUE),        # binary value, 0 or 1
  sex = sample(1:2, 600, replace = TRUE),      # integer code, 1 or 2
  edu = sample(1:4, 600, replace = TRUE),      # integer code, 1 to 4
  BMI = rnorm(600, mean = 22, sd = 3),
  白蛋白 = rnorm(600, mean = 35, sd = 6),      # column name means "albumin"
  随机血糖 = rnorm(600, mean = 4.75, sd = 1.2) # "random blood glucose"
)

# Print per-column descriptive statistics as a quick sanity check.
summary(log_data)
#> Y sex edu BMI 白蛋白 随机血糖
#> Min. :0.0000 Min. :1.000 Min. :1.00 Min. :13.21 Min. :16.27 Min. :1.036
#> 1st Qu.:0.0000 1st Qu.:1.000 1st Qu.:2.00 1st Qu.:20.18 1st Qu.:30.94 1st Qu.:3.956
#> Median :1.0000 Median :1.000 Median :3.00 Median :22.17 Median :34.78 Median :4.816
#> Mean :0.5017 Mean :1.467 Mean :2.57 Mean :22.05 Mean :35.04 Mean :4.778
#> 3rd Qu.:1.0000 3rd Qu.:2.000 3rd Qu.:4.00 3rd Qu.:23.98 3rd Qu.:39.19 3rd Qu.:5.579
#> Max. :1.0000 Max. :2.000 Max. :4.00 Max. :30.07 Max. :54.01 Max. :8.377